<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>1471-2164-13-300</ui>
   <ji>1471-2164</ji>
   <fm>
      <dochead>Research article</dochead>
      <bibl>
         <title>
            <p>Single-base resolution maps of cultivated and wild rice methylomes and regulatory roles of DNA methylation in plant gene expression</p>
         </title>
         <aug>
            <au id="A1"><snm>Li</snm><fnm>Xin</fnm><insr iid="I1"/><insr iid="I2"/><email>lixin@mail.kiz.ac.cn</email></au>
            <au id="A2"><snm>Zhu</snm><fnm>Jingde</fnm><insr iid="I3"/><insr iid="I4"/><email>zhujingde@gmail.com</email></au>
            <au id="A3"><snm>Hu</snm><fnm>Fengyi</fnm><insr iid="I5"/><email>hfengyiyaas@yahoo.com.cn</email></au>
            <au id="A4"><snm>Ge</snm><fnm>Song</fnm><insr iid="I6"/><email>gesong@ibcas.ac.cn</email></au>
            <au id="A5"><snm>Ye</snm><fnm>Mingzhi</fnm><insr iid="I2"/><email>yemz@genomics.org.cn</email></au>
            <au id="A6"><snm>Xiang</snm><fnm>Hui</fnm><insr iid="I1"/><email>xiangh@mail.kiz.ac.cn</email></au>
            <au id="A7"><snm>Zhang</snm><fnm>Guojie</fnm><insr iid="I1"/><insr iid="I2"/><email>zhanggj@genomics.org.cn</email></au>
            <au id="A8"><snm>Zheng</snm><fnm>Xiaoming</fnm><insr iid="I6"/><email>zhengxm@ibcas.ac.cn</email></au>
            <au id="A9"><snm>Zhang</snm><fnm>Hongyu</fnm><insr iid="I3"/><email>possetcn@163.com</email></au>
            <au id="A10"><snm>Zhang</snm><fnm>Shilai</fnm><insr iid="I5"/><email>zsl1192005@163.com</email></au>
            <au id="A11"><snm>Li</snm><fnm>Qiong</fnm><insr iid="I5"/><email>liqiong1983@126.com</email></au>
            <au id="A12"><snm>Luo</snm><fnm>Ruibang</fnm><insr iid="I2"/><insr iid="I7"/><email>luorb@genomics.org.cn</email></au>
            <au id="A13"><snm>Yu</snm><fnm>Chang</fnm><insr iid="I2"/><email>yuch@genomics.org.cn</email></au>
            <au id="A14"><snm>Yu</snm><fnm>Jian</fnm><insr iid="I3"/><email>gyujian@163.com</email></au>
            <au id="A15"><snm>Sun</snm><fnm>Jingfeng</fnm><insr iid="I3"/><email>sunjinfengshci@163.com</email></au>
            <au id="A16"><snm>Zou</snm><fnm>Xiaoyu</fnm><insr iid="I3"/><email>zouxy2001@163.com</email></au>
            <au id="A17"><snm>Cao</snm><fnm>Xiaofeng</fnm><insr iid="I8"/><email>xfcao808@gmail.com</email></au>
            <au id="A18" ca="yes"><snm>Xie</snm><fnm>Xianfa</fnm><insr iid="I9"/><email>xxie@vsu.edu</email></au>
            <au id="A19" ca="yes"><snm>Wang</snm><fnm>Jun</fnm><insr iid="I2"/><insr iid="I10"/><email>wangj@genomics.org.cn</email></au>
            <au id="A20" ca="yes"><snm>Wang</snm><fnm>Wen</fnm><insr iid="I1"/><email>wwang@mail.kiz.ac.cn</email></au>
         </aug>
         <insg>
            <ins id="I1"><p>CAS-Max Planck Junior Research Group, State Key Laboratory of Genetic Resources and Evolution, Kunming Institute of Zoology, Chinese Academy of Sciences, Kunming, 650223, China</p></ins>
            <ins id="I2"><p>BGI-Shenzhen, Shenzhen, 518083, China</p></ins>
            <ins id="I3"><p>Shanghai Cancer Institute, Renji Hospital affiliated to School of Medicine, Shanghai Jiaotong University, LN 2200/25, Xietu Road, Shanghai, 200032, China</p></ins>
            <ins id="I4"><p>Center for Basic and Translational Epigenetic Research of Diseases, School of Life Science, Anhui Medical University, Hefei, 230032, China</p></ins>
            <ins id="I5"><p>Food Crops Research Institute, Yunnan Academy of Agricultural Sciences, Kunming, 650205, China</p></ins>
            <ins id="I6"><p>State Key Laboratory of Systematic and Evolutionary Botany, Institute of Botany, Chinese Academy of Sciences (CAS), Beijing, 100093, China</p></ins>
            <ins id="I7"><p>School of Bioscience and Biotechnology, South China University of Technology, Guangzhou, 510641, China</p></ins>
            <ins id="I8"><p>The State Key Laboratory of Plant Genomics, National Center for Plant Gene Research, Institute of Genetics and Developmental Biology, Chinese Academy of Sciences, Beijing, 100101, China</p></ins>
            <ins id="I9"><p>Department of Biology, Virginia State University, Petersburg, VA, 23806, USA</p></ins>
            <ins id="I10"><p>Department of Biology, University of Copenhagen, Copenhagen, DK-2200, Denmark</p></ins>
         </insg>
         <source>BMC Genomics</source>
         <section><title><p>Plant genomics</p></title></section>
         <issn>1471-2164</issn>
         <pubdate>2012</pubdate>
         <volume>13</volume>
         <issue>1</issue>
         <fpage>300</fpage>
         <url>http://www.biomedcentral.com/1471-2164/13/300</url>
         <xrefbib><pubidlist><pubid idtype="doi">10.1186/1471-2164-13-300</pubid><pubid idtype="pmpid">22747568</pubid></pubidlist></xrefbib>
      </bibl>
      <history><rec><date><day>18</day><month>10</month><year>2011</year></date></rec><acc><date><day>29</day><month>5</month><year>2012</year></date></acc><pub><date><day>2</day><month>7</month><year>2012</year></date></pub></history>
      <cpyrt><year>2012</year><collab>Li et al.; licensee BioMed Central Ltd.</collab><note>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note></cpyrt>
      <kwdg>
         <kwd>Cultivated and wild rice</kwd>
         <kwd>Methylomes</kwd>
         <kwd>Transcriptional termination regions (TTRs)</kwd>
         <kwd>Gene expression</kwd>
      </kwdg>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>DNA methylation plays important biological roles in plants and animals. To examine the rice genomic methylation landscape and assess its functional significance, we generated single-base resolution DNA methylome maps for Asian cultivated rice <it>Oryza sativa</it> ssp<it>. japonica</it>, <it>indica</it> and their wild relatives, <it>Oryza rufipogon</it> and <it>Oryza nivara</it>.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>The overall methylation level of rice genomes is four times higher than that of <it>Arabidopsis</it>. Consistent with the results reported for <it>Arabidopsis</it>, methylation in promoters represses gene expression while gene-body methylation generally appears to be positively associated with gene expression<b>.</b> Interestingly, we discovered that methylation in gene transcriptional termination regions (TTRs) can significantly repress gene expression, and the effect is even stronger than that of promoter methylation. Through integrated analysis of genomic, DNA methylomic and transcriptomic differences between cultivated and wild rice, we found that primary DNA sequence divergence is the major determinant of methylational differences at the whole genome level, but DNA methylational difference alone can only account for limited gene expression variation between the cultivated and wild rice. Furthermore, we identified a number of genes with significant difference in methylation level between the wild and cultivated rice.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusions</p>
               </st>
               <p>The single-base resolution methylomes of rice obtained in this study have not only broadened our understanding of the mechanism and function of DNA methylation in plant genomes, but also provided valuable data for future studies of rice epigenetics and the epigenetic differentiation between wild and cultivated rice.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>DNA methylation is an epigenetic modification mechanism that plays essential roles in diverse biological processes <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. It has also been proposed to be an alternative inheritance system playing an important role in evolution <abbrgrp><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr></abbrgrp>, as many case studies in plants and animals have revealed that differentially methylated alleles could create heritable phenotypic changes across generations <abbrgrp><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr><abbr bid="B6">6</abbr><abbr bid="B7">7</abbr><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr></abbrgrp>, including some agronomically important traits in rice <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>. Recently, single-base resolution methylome maps of a dicot plant (<it>Arabidopsis thaliana</it>), human and silkworm have been successfully generated by whole-genome sequencing bisulfite-treated genomic DNA using next-generation sequencing technology (BS-Seq), which revealed more elaborate patterns and functional effects of DNA methylation at the whole-genome level <abbrgrp><abbr bid="B12">12</abbr><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr><abbr bid="B15">15</abbr></abbrgrp>.</p>
         <p>Rice is not only one of the most important crops as the primary food source for more than half of the world&#8217;s population, but also an important model system for the evolutionary study of cereals and the molecular study of monocot plants. DNA methylation serves various important functions and thus has been of great interest to rice geneticists and breeders. Pioneer studies of epigenetic modifications in rice, including DNA and histone methylation, using traditional methylated DNA enrichment method suggested possible functional roles of DNA methylation in rice <abbrgrp><abbr bid="B16">16</abbr><abbr bid="B17">17</abbr></abbrgrp>, but this approach is difficult to discriminate major genomic elements including promoters, gene bodies, transposons, and repeats. Recently two other studies comparing methylation patterns among many species using BS-Seq technology briefly reported genome methylation patterns for <it>japonica</it> rice strain <it>Nipponbare</it><abbrgrp><abbr bid="B18">18</abbr><abbr bid="B19">19</abbr></abbrgrp>. However, the two <it>Nipponbare</it> methylomes had relatively low sequencing coverage (&lt; 4&#215; per base for each strand). Furthermore, one of the studies <abbrgrp><abbr bid="B18">18</abbr></abbrgrp> used different tissues to obtain methylomic (from leaves) and transcriptomic (from shoots) profiles and the other did not obtain gene expression data at all, which made it difficult to accurately analyze the regulatory effects of DNA methylation in rice. As acknowledged by Feng et al. <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>, such a low genome-wide sequencing depth permitted good assessment of the level of methylation of major genomic elements including genes, transposons, and repeats, but was not sufficient for quantifing the methylation level at individual cytosines. Furthermore, to what extent and how the cultivated rice has evolved divergent DNA methylation pattern from its wild relative species still need to be addressed.</p>
         <p>In this study, we generated single-base-resolution DNA methylomic maps as well as transcriptomic profiles for young panicles of the two Asian cultivated rice subspecies, <it>Oryza sativa</it> ssp<it>. japonica</it> and <it>O. sativa</it> ssp<it>. indica</it>, and their wild relatives, <it>Oryza rufipogon</it> and <it>Oryza nivara</it>. The panicle is an important organ showing strong differentiation between cultivated and wild rice and directly affects the major yield components including the number of spikelets and the percentage of filled grains <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>. The high-resolution DNA methylomes of cultivated and domestic rice will not only serve as references for future molecular studies of rice epigenetics but also shed new lights into epigenetic mechanisms of plant domestication.</p>
      </sec>
      <sec>
         <st>
            <p>Results and discussions</p>
         </st>
         <sec>
            <st>
               <p>Methylation landscapes in rice</p>
            </st>
            <p>To investigate the general methylation patterns of rice as well as the DNA methylation divergence between cultivated and wild rice, we included in our samples both subspecies of Asian cultivated rice, <it>Oryza sativa</it> spp. <it>japonica</it> (represented by Dianjingyou1, bred by the Yunnan Academy of Agricultural Sciences, China, which is a typical <it>japonica</it> rice type mainly suitable to be planted in Yunnan) and <it>indica</it> (IR64, from the International Rice Research Institute, IRRI), and their wild relatives, <it>Oryza rufipogon</it> (Accession 105327, originally collected from Sri Lanka and provided by IRRI) and <it>Oryza nivara</it> (Accession 105426, originally collected from India and provided by IRRI).</p>
            <p>For each of the four rice lines, a young panicle was used to generate a methylomic map with the BS-Seq method. 170&#8211;320 million sequencing reads were generated for each of the four samples, respectively. After removing low-quality and clonal reads (artificially generated during amplification of bisulfate-treated DNA in constructing sequencing libraries, see Material and methods for details), 58&#8211;176 million uniquely mapped high-quality reads were retained for each of the four rice lines, yielding 2.6-9.2 gigabases (Gb) of data which cover 76-91% of the reference Nipponbare genome (International Rice Genome Sequencing Project, 2005), respectively (Table <tblr tid="T1">1</tblr>). The read depths range from 4.5&#215; to 13.5&#215; per base for each DNA strand (Table <tblr tid="T1">1</tblr>). Because <it>japonica</it> has the best reference genome and we obtained the highest genome coverage and sequencing depth for the <it>japonica</it> strain Dianjingyou1, here we use the <it>japonica</it> accession as the representative to describe the general methylation landscape of rice, with the differences between wild and cultivated rice being discussed later.</p>
            <table id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>
                     <b>Data description of BS-Seq reads for the four rice samples</b>
                  </p>
               </caption>
               <tgroup align="left" cols="5">
                  <colspec align="left" colname="c1" colnum="1" colwidth="1*"/>
                  <colspec align="left" colname="c2" colnum="2" colwidth="1*"/>
                  <colspec align="left" colname="c3" colnum="3" colwidth="1*"/>
                  <colspec align="left" colname="c4" colnum="4" colwidth="1*"/>
                  <colspec align="left" colname="c5" colnum="5" colwidth="1*"/>
                  <thead valign="top">
                     <row rowsep="1">
                        <entry colname="c1">
                           <p>
                              <b>Sample</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>
                              <b>
                                 <it>Japonica</it>
                              </b>
                           </p>
                        </entry>
                        <entry colname="c3">
                           <p>
                              <b>
                                 <it>Indica</it>
                              </b>
                           </p>
                        </entry>
                        <entry colname="c4">
                           <p>
                              <b>
                                 <it>O. rufipogon</it>
                              </b>
                           </p>
                        </entry>
                        <entry colname="c5">
                           <p>
                              <b>
                                 <it>O. nivara</it>
                              </b>
                           </p>
                        </entry>
                     </row>
                  </thead>
                  <tbody valign="top">
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Raw reads number/data production (Gb)</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>320,730,854/16.2</p>
                        </entry>
                        <entry colname="c3">
                           <p>170,784,798/7.5</p>
                        </entry>
                        <entry colname="c4">
                           <p>171,346,432/7.5</p>
                        </entry>
                        <entry colname="c5">
                           <p>203,796,688/9.0</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Effective reads number/data production (Gb)</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>175,749,760/9.2</p>
                        </entry>
                        <entry colname="c3">
                           <p>58,423,521/2.6</p>
                        </entry>
                        <entry colname="c4">
                           <p>68,773,618/3.0</p>
                        </entry>
                        <entry colname="c5">
                           <p>81,784,095/3.6</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Genome coverage</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>91%</p>
                        </entry>
                        <entry colname="c3">
                           <p>76%</p>
                        </entry>
                        <entry colname="c4">
                           <p>78%</p>
                        </entry>
                        <entry colname="c5">
                           <p>77%</p>
                        </entry>
                     </row>
                     <row rowsep="1">
                        <entry colname="c1">
                           <p>
                              <b>Average read depth per base per strand</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>13.5 &#215;</p>
                        </entry>
                        <entry colname="c3">
                           <p>4.54 &#215;</p>
                        </entry>
                        <entry colname="c4">
                           <p>5.17 &#215;</p>
                        </entry>
                        <entry colname="c5">
                           <p>6.25&#215;</p>
                        </entry>
                     </row>
                  </tbody>
               </tgroup>
            </table>
            <p>We used the unmethylated chloroplast genome <abbrgrp><abbr bid="B21">21</abbr></abbrgrp> to calculate the sum of non-conversion rate and T-C sequencing error rate, which is as low as 0.47% to 1.17% for the four samples respectively (Table <tblr tid="T2">2</tblr>). Using these values we then conducted binomial tests with false positive rate below 5% to exclude those mCs that may be the results of non-conversion of cytosines during our bisulfite treatment or T to C sequencing errors during the base calling process. After this correction, we identified 35,598,491 methylated cytosines (mCs) accounting for 24.3% of all covered cytosines throughout the reference genome in the <it>japonica</it> Dianjingyou1 (Table <tblr tid="T2">2</tblr>), which is four times higher than that of <it>Arabidopsis</it><abbrgrp><abbr bid="B13">13</abbr></abbrgrp> in terms of mC density. The percentages of mCs in CG, CHG (with H being A, C or T) and CHH contexts are 54.7%, 37.3% and 12.0%, respectively while the average methylation level in the three contexts are 44.5%, 24.1% and 4.7%, respectively, with methylation level being defined as the proportion of reads showing mC among all reads covering the same cytosine site. Both of these measures reveal that rice has much higher level of genome-wide DNA methylation than <it>A. thaliana</it><abbrgrp><abbr bid="B12">12</abbr><abbr bid="B13">13</abbr></abbrgrp> (Table <tblr tid="T2">2</tblr>). These patterns are more or less the same in <it>indica</it> and the two wild rice species (Table <tblr tid="T2">2</tblr>), and are consistent with the two previous studies of rice leaf methylomes <abbrgrp><abbr bid="B18">18</abbr><abbr bid="B19">19</abbr></abbrgrp>.</p>
            <table id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>
                     <b>Conversion rate and methylation pattern for the four rice samples</b>
                  </p>
               </caption>
               <tgroup align="left" cols="7">
                  <colspec align="left" colname="c1" colnum="1" colwidth="1*"/>
                  <colspec align="left" colname="c2" colnum="2" colwidth="1*"/>
                  <colspec align="left" colname="c3" colnum="3" colwidth="1*"/>
                  <colspec align="left" colname="c4" colnum="4" colwidth="1*"/>
                  <colspec align="left" colname="c5" colnum="5" colwidth="1*"/>
                  <colspec align="left" colname="c6" colnum="6" colwidth="1*"/>
                  <colspec align="left" colname="c7" colnum="7" colwidth="1*"/>
                  <thead valign="top">
                     <row rowsep="1">
                        <entry colname="c1">
                           <p>
                              <b>Sample</b>
                           </p>
                        </entry>
                        <entry colname="c2" nameend="c4" namest="c2">
                           <p>
                              <b>Japonica</b>
                           </p>
                        </entry>
                        <entry colname="c5" nameend="c7" namest="c5">
                           <p>
                              <b>Indica</b>
                           </p>
                        </entry>
                     </row>
                  </thead>
                  <tfoot>
                     <p>* The sum of non-conversion rate and T-C sequencing error rate.</p>
                  </tfoot>
                  <tbody valign="top">
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>error rate</b>
                              <sup>
                                 <b>*</b>
                              </sup>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>
                              <b>1.12%</b>
                           </p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Methylation</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>Methylcytosine number</p>
                        </entry>
                        <entry colname="c3">
                           <p>Methylation density</p>
                        </entry>
                        <entry colname="c4">
                           <p>Average methylation level of all cytosines</p>
                        </entry>
                        <entry colname="c5">
                           <p>Methylcytosine number</p>
                        </entry>
                        <entry colname="c6">
                           <p>Methylation density</p>
                        </entry>
                        <entry colname="c7">
                           <p>Average methylation level of all cytosines</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Total</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>35,598,491</p>
                        </entry>
                        <entry colname="c3">
                           <p>24.27%</p>
                        </entry>
                        <entry colname="c4">
                           <p>15.40%</p>
                        </entry>
                        <entry colname="c5">
                           <p>22,559,747</p>
                        </entry>
                        <entry colname="c6">
                           <p>18.85%</p>
                        </entry>
                        <entry colname="c7">
                           <p>9.81%</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>CG</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>14,989,765</p>
                        </entry>
                        <entry colname="c3">
                           <p>54.68%</p>
                        </entry>
                        <entry colname="c4">
                           <p>44.46%</p>
                        </entry>
                        <entry colname="c5">
                           <p>9,881,382</p>
                        </entry>
                        <entry colname="c6">
                           <p>45.17%</p>
                        </entry>
                        <entry colname="c7">
                           <p>27.77%</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>CHG</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>9,238,307</p>
                        </entry>
                        <entry colname="c3">
                           <p>37.31%</p>
                        </entry>
                        <entry colname="c4">
                           <p>20.14%</p>
                        </entry>
                        <entry colname="c5">
                           <p>5,553,755</p>
                        </entry>
                        <entry colname="c6">
                           <p>27.29%</p>
                        </entry>
                        <entry colname="c7">
                           <p>13.48%</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>CHH</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>11,370,419</p>
                        </entry>
                        <entry colname="c3">
                           <p>12.03%</p>
                        </entry>
                        <entry colname="c4">
                           <p>4.02%</p>
                        </entry>
                        <entry colname="c5">
                           <p>7,124,610</p>
                        </entry>
                        <entry colname="c6">
                           <p>9.20%</p>
                        </entry>
                        <entry colname="c7">
                           <p>3.16%</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Sample</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>
                              <b>
                                 <it>O. rufipogon</it>
                              </b>
                           </p>
                        </entry>
                        <entry colname="c3"/>
                        <entry colname="c4"/>
                        <entry colname="c5">
                           <p>
                              <b>
                                 <it>O. nivara</it>
                              </b>
                           </p>
                        </entry>
                        <entry colname="c6"/>
                        <entry colname="c7"/>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>error rate</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>0.47%</p>
                        </entry>
                        <entry colname="c3"/>
                        <entry colname="c4"/>
                        <entry colname="c5">
                           <p>0.94%</p>
                        </entry>
                        <entry colname="c6"/>
                        <entry colname="c7"/>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Methylation</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>Methylcytosine number</p>
                        </entry>
                        <entry colname="c3">
                           <p>Methylation density</p>
                        </entry>
                        <entry colname="c4">
                           <p>Average methylation level of all cytosines</p>
                        </entry>
                        <entry colname="c5">
                           <p>Methylcytosine number</p>
                        </entry>
                        <entry colname="c6">
                           <p>Methylation density</p>
                        </entry>
                        <entry colname="c7">
                           <p>Average methylation level of all cytosines</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Total</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>23,358,199</p>
                        </entry>
                        <entry colname="c3">
                           <p>18.95%</p>
                        </entry>
                        <entry colname="c4">
                           <p>9.05%</p>
                        </entry>
                        <entry colname="c5">
                           <p>24,308,799</p>
                        </entry>
                        <entry colname="c6">
                           <p>20.75%</p>
                        </entry>
                        <entry colname="c7">
                           <p>13.79%</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>CG</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>10,333,979</p>
                        </entry>
                        <entry colname="c3">
                           <p>46.75%</p>
                        </entry>
                        <entry colname="c4">
                           <p>30.82%</p>
                        </entry>
                        <entry colname="c5">
                           <p>9,991,032</p>
                        </entry>
                        <entry colname="c6">
                           <p>49.63%</p>
                        </entry>
                        <entry colname="c7">
                           <p>45.46%</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>CHG</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>5,785,271</p>
                        </entry>
                        <entry colname="c3">
                           <p>27.89%</p>
                        </entry>
                        <entry colname="c4">
                           <p>12.74%</p>
                        </entry>
                        <entry colname="c5">
                           <p>5,735,875</p>
                        </entry>
                        <entry colname="c6">
                           <p>29.46%</p>
                        </entry>
                        <entry colname="c7">
                           <p>19.18%</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>CHH</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>7,238,949</p>
                        </entry>
                        <entry colname="c3">
                           <p>9.00%</p>
                        </entry>
                        <entry colname="c4">
                           <p>2.75%</p>
                        </entry>
                        <entry colname="c5">
                           <p>8,581,892</p>
                        </entry>
                        <entry colname="c6">
                           <p>11.07%</p>
                        </entry>
                        <entry colname="c7">
                           <p>5.75%</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Sample</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>
                              <b>
                                 <it>Arabidopsis</it>
                              </b>
                              <abbrgrp>
                                 <abbr bid="B12">12</abbr>
                                 <abbr bid="B13">13</abbr>
                              </abbrgrp>
                           </p>
                        </entry>
                        <entry colname="c3"/>
                        <entry colname="c4"/>
                        <entry colname="c5"/>
                        <entry colname="c6"/>
                        <entry colname="c7"/>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>error rate</b>
                           </p>
                        </entry>
                        <entry colname="c2"/>
                        <entry colname="c3"/>
                        <entry colname="c4"/>
                        <entry colname="c5"/>
                        <entry colname="c6"/>
                        <entry colname="c7"/>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Methylation</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>Methylation density</p>
                        </entry>
                        <entry colname="c3">
                           <p>Average methylation level of all cytosines</p>
                        </entry>
                        <entry colname="c4"/>
                        <entry colname="c5"/>
                        <entry colname="c6"/>
                        <entry colname="c7"/>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Total</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>5.26%</p>
                        </entry>
                        <entry colname="c3">
                           <p>NA</p>
                        </entry>
                        <entry colname="c4"/>
                        <entry colname="c5"/>
                        <entry colname="c6"/>
                        <entry colname="c7"/>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>CG</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>NA</p>
                        </entry>
                        <entry colname="c3">
                           <p>24.00%</p>
                        </entry>
                        <entry colname="c4"/>
                        <entry colname="c5"/>
                        <entry colname="c6"/>
                        <entry colname="c7"/>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>CHG</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>NA</p>
                        </entry>
                        <entry colname="c3">
                           <p>6.70%</p>
                        </entry>
                        <entry colname="c4"/>
                        <entry colname="c5"/>
                        <entry colname="c6"/>
                        <entry colname="c7"/>
                     </row>
                     <row rowsep="1">
                        <entry colname="c1">
                           <p>
                              <b>CHH</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>NA</p>
                        </entry>
                        <entry colname="c3">
                           <p>1.70%</p>
                        </entry>
                        <entry colname="c4"/>
                        <entry colname="c5"/>
                        <entry colname="c6"/>
                        <entry colname="c7"/>
                     </row>
                  </tbody>
               </tgroup>
            </table>
            <p>The genome-wide methylation patterns with respect to the genomic structure in rice young panicles are similar to those observed in <it>A. thaliana</it><abbrgrp><abbr bid="B12">12</abbr><abbr bid="B13">13</abbr><abbr bid="B22">22</abbr></abbrgrp> and in rice leaves <abbrgrp><abbr bid="B18">18</abbr><abbr bid="B19">19</abbr></abbrgrp>, particularly in the relative prevalence of mCs in the contexts of GG, CHG, and CHH (Figure <figr fid="F1">1</figr>a), the tendency toward hypermethylation in CG context but hypomethylation in CHH (Figure <figr fid="F1">1</figr>b), the high methylation level in transposable elements (TEs) and the relatively low level of methylation in genic regions, the enrichment of CG methylation in gene bodies (Figure <figr fid="F2">2</figr>a-f), and the enrichment of small RNA loci in TEs and depletion in genic regions (Figure <figr fid="F2">2</figr>g and <figr fid="F2">2</figr>h).</p>
            <fig id="F1"><title><p>Figure 1</p></title><caption><p>DNA methylation pattern in the <it>japonica</it> rice (Dianjingyou1)</p></caption><text>
   <p><b>DNA methylation pattern in the </b><b><it>japonica</it></b><b> rice (Dianjingyou1). (a)</b> Relative proportions of mCs in three sequence contexts. <b>(b)</b> Distribution of methylation level of mCs in each sequence context. Only mCs covered by at least 5 reads were used to calculate methylation level. Methylation level on the x-axis was defined as the percentage of reads showing methylated cytosine at a reference cytosine site. The y-axis indicates the fraction of total mCs calculated within bins of 10%.</p>
</text><graphic file="1471-2164-13-300-1"/></fig>
            <fig id="F2"><title><p>Figure 2</p></title><caption><p>DNA methylation patterns in different genomic regions</p></caption><text>
   <p><b>DNA methylation patterns in different genomic regions.</b> Methylation patterns were characterized in following functional regions: TEs, small RNA (smRNA) loci, and genic regions including the promoter (200&#8201;bp upstream of the transcriptional start site, TSS), gene body (the entire transcribed region), and the transcriptional termination region (TTR, 200&#8201;bp downstream of transcriptional termination site). Gene body is further divided into untranslated regions (UTRs), coding regions (CDs), and introns. Methylation level, TE density and smRNA locus density were calculated across TE, gene body and their flanking sequences using an overlapping sliding window of 5% of the sequence length at a step of 2.5% of the sequence length. <b>(a)</b> Fraction of total mCs in each sequence context for different genomic regions. <b>(b)</b> Relative methylation level (total methylation level of mCs divided by sequence length of the calculated region) in each sequence context for different genomic regions. Distributions of absolute methylation level (total methylation level of mCs divided by total number of cytosine sites in the calculated region) <b>(c)</b> and relative methylation level <b>(d)</b> in gene body and 2-kb flanking sequences on both sides. Absolute <b>(e)</b> and relative <b>(f)</b> methylation level distributions in TE and 0.5-kb flanking sequences on both sides. <b>(g)</b> TE and smRNA density distributions in gene body and 2-kb flanking sequences. <b>(h)</b> smRNA density distribution throughout TE and 0.5&#8201;kb-flanking sequences. Relationships between methylation level and sequence length in genes <b>(i)</b> and TE regions <b>(j)</b>, in which both absolute (top) and relative (bottom) methylation levels were analyzed.</p>
</text><graphic file="1471-2164-13-300-2"/></fig>
         </sec>
         <sec>
            <st>
               <p>Difference of methylation landscapes between rice and <it>A. thaliana</it></p>
            </st>
            <p>However, in contrast to the significantly enriched methylation in all the three sequence contexts around the centromeric regions in <it>A. thaliana</it> genome <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>, rice shows much less difference between centromeric and non-centromeric regions with only slight CG and CHG methylation enrichment around the centromeric regions and almost uniform distribution of CHH mCs across entire chromosomes (Figure <figr fid="F3">3</figr>). This is probably due to the fact that compared to <it>A. thaliana</it>, rice has significantly larger amount of pericentromeric heterochromatin <abbrgrp><abbr bid="B23">23</abbr><abbr bid="B24">24</abbr></abbrgrp> and much higher proportion of TEs distributed across the genome, both of which are heavily methylated.</p>
            <fig id="F3"><title><p>Figure 3</p></title><caption><p>Distribution of mCs on the sense and antisense strands of rice chromosomes for each sequence context</p></caption><text>
   <p><b>Distribution of mCs on the sense and antisense strands of rice chromosomes for each sequence context.</b> The sliding window size is 50&#8201;kb and the step size is 25&#8201;kb. The black circle indicates the centromeric position of a chromosome. Some centromeric regions of chromosomes have not been completely sequenced and thus are displayed as gaps in the figure.</p>
</text><graphic file="1471-2164-13-300-3"/></fig>
            <p>In addition, we found a positive correlation between sequence length and methylation density for genes (Figure <figr fid="F2">2</figr>i), but not for TEs (Figure <figr fid="F2">2</figr>j), which is different from the case in <it>A. thaliana</it> wherein both genes and TEs showed positive correlation between sequence length and methylation <abbrgrp><abbr bid="B12">12</abbr></abbrgrp>. This might be due to the fact that TEs in rice genome are almost saturated with mCs regardless of their length. All the above results are consistently found in all the four rice samples (see Additional files <supplr sid="S1">1</supplr> and <supplr sid="S2">2</supplr> for results of other samples), showing these are general patterns in both cultivated and wild rice. These differences between rice and <it>Arabidopsis</it> suggest that differences in genomic organization and TE composition among plants could result in different epigenomic landscapes.</p>
            <suppl id="S1">
               <title>
                  <p>Additional file 1</p>
               </title>
               <text>
                  <p><b>Distribution of mCs on the sense and antisense strands of rice chromosomes for each sequence context in other samples (a) indica. (b) O. rufipogon. (c) O. nivara.</b> The sliding window size is 50 kb and the step size is 25 kb. The black circle indicates the centromeric position of a chromosome. Some centromeric regions of chromosomes have not been completely sequenced and thus are displayed as gaps in the figures.</p>
               </text>
               <file name="1471-2164-13-300-S1.pdf">
   <p>Click here for file</p>
</file>
            </suppl>
            <suppl id="S2">
               <title>
                  <p>Additional file 2</p>
               </title>
               <text>
                  <p>
                     <b>Relationships between methylation level and sequence length in genes (left) and TE regions (right) in indica (a), O. rufipogon (b), and O. nivara (c), in which both absolute (top) and relative (bottom) methylation levels were analyzed.</b>
                  </p>
               </text>
               <file name="1471-2164-13-300-S2.pdf">
   <p>Click here for file</p>
</file>
            </suppl>
         </sec>
         <sec>
            <st>
               <p>Regulatory roles of promoter and gene-body DNA methylation in gene expression</p>
            </st>
            <p>To assess the effects of rice DNA methylation on gene expression, we also generated genome-wide gene expression profiles for all the four samples (Table <tblr tid="T3">3</tblr>) using Digital Gene Expression tag profiling (DGE) technology, which combines the classic SAGE (Serial Analysis of Gene Expression) with the Illumina sequencing techniques. In total we obtained 7,343,629 to 7,774,577 raw reads with 599,304 to 648,947 unique tag sequences for each of the four samples. After filtration and mapping reads to 24,955 non-redundant full-length cDNAs (FL-cDNAs) of rice, our DGE data cover 79% to 83% of all FL-cDNAs with a one-tag-one-cDNA relationship (Table <tblr tid="T3">3</tblr>).</p>
            <table id="T3">
               <title>
                  <p>Table 3</p>
               </title>
               <caption>
                  <p>
                     <b>DGE data description for the four rice samples</b>
                  </p>
               </caption>
               <tgroup align="left" cols="5">
                  <colspec align="left" colname="c1" colnum="1" colwidth="1*"/>
                  <colspec align="left" colname="c2" colnum="2" colwidth="1*"/>
                  <colspec align="left" colname="c3" colnum="3" colwidth="1*"/>
                  <colspec align="left" colname="c4" colnum="4" colwidth="1*"/>
                  <colspec align="left" colname="c5" colnum="5" colwidth="1*"/>
                  <thead valign="top">
                     <row rowsep="1">
                        <entry colname="c1">
                           <p>
                              <b>Sample</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>
                              <b>
                                 <it>Japonica</it>
                              </b>
                           </p>
                        </entry>
                        <entry colname="c3">
                           <p>
                              <b>
                                 <it>Indica</it>
                              </b>
                           </p>
                        </entry>
                        <entry colname="c4">
                           <p>
                              <b>
                                 <it>O. rufipogon</it>
                              </b>
                           </p>
                        </entry>
                        <entry colname="c5">
                           <p>
                              <b>
                                 <it>O. nivara</it>
                              </b>
                           </p>
                        </entry>
                     </row>
                  </thead>
                  <tbody valign="top">
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Raw/distinct tag number</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>7,662,276/648,947</p>
                        </entry>
                        <entry colname="c3">
                           <p>7,418,013/562,392</p>
                        </entry>
                        <entry colname="c4">
                           <p>7,774,577/561,691</p>
                        </entry>
                        <entry colname="c5">
                           <p>7,343,629/599,304</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Total/distinct tag number used in analysis</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>7,589,226/612,176</p>
                        </entry>
                        <entry colname="c3">
                           <p>7,413,872/558,498</p>
                        </entry>
                        <entry colname="c4">
                           <p>7,769,442/556,909</p>
                        </entry>
                        <entry colname="c5">
                           <p>7,334,416/591,759</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Genes with CATG sites</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>24,611 (98.62%)</p>
                        </entry>
                        <entry colname="c3">
                           <p>24,611 (98.62%)</p>
                        </entry>
                        <entry colname="c4">
                           <p>24,611 (98.62%)</p>
                        </entry>
                        <entry colname="c5">
                           <p>24,611 (98.62%)</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>Tags with perfect match to unique gene</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>4,729,194</p>
                        </entry>
                        <entry colname="c3">
                           <p>4,295,776</p>
                        </entry>
                        <entry colname="c4">
                           <p>4,579,715</p>
                        </entry>
                        <entry colname="c5">
                           <p>4,162,572</p>
                        </entry>
                     </row>
                     <row rowsep="1">
                        <entry colname="c1">
                           <p>
                              <b>Genes with perfect match to unique tags</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>20,682 (82.88%)</p>
                        </entry>
                        <entry colname="c3">
                           <p>19,804 (79.36%)</p>
                        </entry>
                        <entry colname="c4">
                           <p>20,095 (80.52%)</p>
                        </entry>
                        <entry colname="c5">
                           <p>19,745 (79.12%)</p>
                        </entry>
                     </row>
                  </tbody>
               </tgroup>
            </table>
            <p>Although some previous studies have also explored the relationship between DNA methylation and gene expression in rice <abbrgrp><abbr bid="B16">16</abbr><abbr bid="B18">18</abbr></abbrgrp>, their low resolution of genome-wide methylated cytokines (mCs) <abbrgrp><abbr bid="B16">16</abbr></abbrgrp> or utilization of different tissues in generating transcriptomic and methylomic profiles <abbrgrp><abbr bid="B18">18</abbr></abbrgrp> created the need for more elaborate methylomic studies to comprehensively unveil high resolution rice methylomes and detailed functional effects of rice DNA methylation. Here we shall mainly use the <it>japonica</it> data to present the detailed patterns in rice, which are similar in all four samples (see Additional file <supplr sid="S3">3</supplr> for results of the other three samples).</p>
            <suppl id="S3">
               <title>
                  <p>Additional file 3</p>
               </title>
               <text>
                  <p><b>Relationships between gene expression and methylation in different genic regions for indica (a-b), O. rufipogon (c-d), and O. nivara (e-f).</b> For panel a, c and e, genes are categorized into unmethylated (black line) and methylated ones, and the latter were further divided into five groups based on methylation level (from Group 1 of the 20% of genes with the lowest methylation to Group 5 of the x20% with the highest methylation level). For panel b, d and f, methylation-expression Spearman correlation coefficients along genes and their 2 kb-flanking regions were displayed. The correlation coefficients were calculated using an overlapping sliding window of 5% of sequence length at a step of 2.5% of sequence length.</p>
               </text>
               <file name="1471-2164-13-300-S3.pdf">
   <p>Click here for file</p>
</file>
            </suppl>
            <p>Our results show that promoter-unmethylated genes have significantly higher expression level than promoter-methylated genes (<it>p</it>&#8201;=&#8201;1.915e-08, Wilcoxon rank sum test), indicating that promoter methylation represses gene expression. Consistent with this conclusion, the repression effect is weak for slightly and moderately promoter-methylated genes while very strong for heavily methylated ones (Figure <figr fid="F4">4</figr>a, and see Additional file <supplr sid="S4">4</supplr> for each sequence context). These results from the high resolution genome-wide data proved false the previous speculation that promoter methylation may not affect rice gene transcription <abbrgrp><abbr bid="B16">16</abbr></abbrgrp> but are consistent with the findings from <it>A. thaliana</it><abbrgrp><abbr bid="B25">25</abbr></abbrgrp>, human <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>, and the recent rice methylome study <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>, confirming that promoter methylation is a general mechanism suppressing gene expression in eukaryotes.</p>
            <suppl id="S4">
               <title>
                  <p>Additional file 4</p>
               </title>
               <text>
                  <p><b>Relationships between gene expression and methylation in different genic regions and sequence contexts.</b>(a) Promoter methylation. (b) TTR methylation. (c) Gene body methylation. Methylation was measured using absolute methylation level (total methylation level of mCs divided by sequence length of the calculated region). Genes are categorized into unmethylated (black line) and methylated ones, and the latter were further divided into five groups based on methylation level (from Group 1 of the 20% of genes with the lowest methylation to Group 5 of the 20% with the highest methylation level). Gene expression level was measured by log2 value of its tag number and is indicated on the x axis. The fraction for each group of methylated and unmethylated genes is shown on the y-axis.</p>
               </text>
               <file name="1471-2164-13-300-S4.pdf">
   <p>Click here for file</p>
</file>
            </suppl>
            <fig id="F4"><title><p>Figure 4</p></title><caption><p>Relationship between methylation level and gene expression in different genic regions</p></caption><text>
   <p><b>Relationship between methylation level and gene expression in different genic regions. (a)</b> Promoter; <b>(b)</b> Gene body; <b>(c)</b> TTR. Methylation level was measured using the absolute methylation level but similar results were also obtained using the relative methylation level. Genes are categorized into unmethylated (black line) and methylated ones, the latter of which were further divided into five groups based on the absolute methylation level (from Group 1 of the 20% of genes with the lowest methylation level to Group 5 of the 20% with the highest methylation level). For clarity, we only display 1st, 3rd and 5th groups. Methylation-expression Spearman correlation coefficients along genes and their 2&#8201;kb-flanking regions in rice <b>(d)</b> and <it>Arabidopsis</it><b>(e)</b>. The methylation-expression Spearman correlation coefficients were also calculated in TTR and promoter regions using genes without TTR methylation (left to the dashed line) and genes without promoter methylation (right to the dashed line) respectively. Methylation was measured using absolute methylation level <b>(f)</b> or relative methylation level <b>(g)</b>. The correlation coefficients were calculated using an overlapping sliding window of 5% of sequence length at a step of 2.5% of sequence length.</p>
</text><graphic file="1471-2164-13-300-4"/></fig>
            <p>In contrast to promoter methylation, gene-body methylation generally appears to be positively correlated to gene expression as body-methylated genes have significantly higher expression level than body-unmethylated genes (<it>p</it>&#8201;&lt;&#8201;2.2e-16, Wilcoxon rank sum test). However, further analysis revealed complicated relationships between gene-body methylation and gene expression. At first gene expression levels increase with methylation levels, but after a certain point, heavy gene-body methylation appears to repress gene expression; and consequently genes with moderate levels of body methylation tend to have the highest expression levels (Figure <figr fid="F4">4</figr>b, see Additional file <supplr sid="S4">4</supplr> for each sequence context). These observations are consistent with previous studies in <it>A. thaliana</it><abbrgrp><abbr bid="B25">25</abbr><abbr bid="B27">27</abbr></abbrgrp> and in rice <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>. It has been proposed that gene-body methylation can prevent transcriptional initiation from cryptic sites within genes but at the cost of impeding transcriptional elongation <abbrgrp><abbr bid="B27">27</abbr></abbrgrp>. This trade-off may have led to the observation that moderately body-methylated genes have the highest level of expression.</p>
         </sec>
         <sec>
            <st>
               <p>Methylation in transcriptional termination region (TTR) can significantly repress gene expression</p>
            </st>
            <p>Most interestingly, our study revealed that methylation in the transcriptional termination region (TTR) is also highly correlated with gene expression. In a pattern similar to promoter methylation, the TTR-unmethylated genes are expressed at significantly higher level than TTR-methylated genes (<it>p</it>&#8201;&lt;&#8201;2.2e-16, Wilcoxon rank sum test). Moreover, an approximately monotonic negative correlation exists between TTR methylation and gene expression (Figure <figr fid="F4">4</figr>c, see Additional file <supplr sid="S4">4</supplr> for each sequence context). Surprisingly, the correlation coefficient is even higher than that of promoters, especially for CG methylation (Figure <figr fid="F4">4</figr>d), suggesting that TTR methylation may play an even more important role in gene expression regulation than promoter methylation. To exclude the possibility that the negative correlation between TTR methylation and gene expression is an indirect effect caused by promoter methylation if promoter-methylated genes are also prone to have methylated TTRs, we repeated the correlation analysis for both TTR and promoter regions using genes without promoter methylation and those without TTR methylation respectively. The strong negative correlation between TTR methylation and gene expression and the higher correlation coefficients than that for promoter methylation could still be observed (Figure <figr fid="F4">4</figr>f and <figr fid="F4">4</figr> g).</p>
            <p>DNA methylation, together with associated histone modification, has been suggested to influence the binding of RNA polymerase to DNA and thus affect the initiation, elongation and termination of the gene transcription process <abbrgrp><abbr bid="B27">27</abbr></abbrgrp>. It has been established that promoter methylation can repress gene expression and promoter hypomethylation may be required for genes to express efficiently <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B25">25</abbr></abbrgrp>. Gene-body methylation has also been proposed to inhibit transcriptional noise in actively transcribed genes and consequently body-methylated genes usually show moderate to high level of expression <abbrgrp><abbr bid="B22">22</abbr><abbr bid="B27">27</abbr><abbr bid="B28">28</abbr></abbrgrp>. It is plausible that TTR methylation could have significant effect on gene expression through interfering with transcriptional termination. Consistent with this hypothesis, active DNA demethylation mediated by the DEMETER (DME) family has been found primarily at both the 5&#8217;- and 3&#8217;- ends of genes in <it>A. thaliana</it>, suggesting a functional role of methylation in both regions <abbrgrp><abbr bid="B29">29</abbr><abbr bid="B30">30</abbr></abbrgrp>.</p>
            <p>To further investigate whether such a regulatory mechanism is shared by plants, we also examined the effects of TTR methylation on gene expression in <it>Arabidopsis</it> using existing data <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>. Consistent with the results from rice, our analysis revealed significant negative correlation between TTR methylation and gene expression in <it>Arabidopsis</it> (Figure <figr fid="F4">4</figr>e), suggesting a general regulatory role of TTR methylation both in monocot and dicot plants.</p>
            <p>In addition, we found that the 5&#8217;-end of gene coding region is another important regulatory region showing significant positive correlation between its methylation and gene expression in <it>Arabidopsis</it>, but not in rice (Figure <figr fid="F4">4</figr>d and <figr fid="F4">4</figr>e), consistent with the <it>Arabidopsis</it>-specific CHH methylation enrichment in this region. Whether this is a dicot-specific regulation mechanism needs further studies using more plant species of both monocots and dicots. It is worth noting that the positive correlation between the 5&#8217;-end gene coding region methylation and gene expression in <it>Arabidopsis</it> could be revealed based on both the absolute (total methylation level of mCs divided by sequence length) and the relative (total methylation level of mCs divided by total number of cytosine sites in a region) methylation levels, but the correspondent CHH methylation enrichment in <it>Arabidopsis</it> could only be revealed using the absolute methylation level (Additional file <supplr sid="S5">5</supplr>). This may explain the failure of previous studies on <it>Arabidopsis</it> to reveal the positive effect of 5&#8217;-end gene methylation on gene expression and suggests absolute methylation level may be better than relative methylation level to affect gene expression.</p>
            <suppl id="S5">
               <title>
                  <p>Additional file 5</p>
               </title>
               <text>
                  <p><b>Methylation level distributions in gene body and 2-kb flanking sequences in Arabidopsis.</b> Absolute (a) and relative (b) methylation level distributions in gene body and 2-kb flanking sequences in Arabidopsis. Methylation levels along gene body and their 2 kb-flanking regions were calculated using an overlapping sliding window of 5% of sequence length at a step of 2.5% of sequence length. The related raw data for Arabidopsis were downloaded from <url>http://www.ncbi.nlm.nih.gov/sra</url>(SRA000284</p>
               </text>
               <file name="1471-2164-13-300-S5.pdf">
   <p>Click here for file</p>
</file>
            </suppl>
         </sec>
         <sec>
            <st>
               <p>Methylome comparison between wild and cultivated rice</p>
            </st>
            <p>To examine the divergence between cultivated and wild rice at genetic, methylation and gene expression levels, we first constructed trees based on genomic, methylomic, and gene expression data, respectively (see Materials and methods) (Figure <figr fid="F5">5</figr>a-c). The genomic DNA tree shows the same topology with the methylation-based trees except for the one constructed using CHH mCs. The consistency between the genomic and methylomic trees suggests that genetic divergence at DNA sequence level may be the major determinant of methylation patterns in the genome. We further examined the relationship between genetic and methylation divergence among samples using sliding windows across the whole genome. The average number of nucleotide differences per site and the average Spearman correlation coefficient of mCs were used to measure genetic and methylation divergence among samples, respectively (see Materials and methods). Through sliding window analysis, we found that regions with high genetic sequence divergence also have high CG methylation divergence (low correlation coefficient) among samples (Figure <figr fid="F6">6</figr>). However, this pattern was not obvious for non-CG methylation, especially CHG methylation. Taken together, these results suggested that genetic divergence may be the major determinant of CG methylation patterns which usually showed high methylation levels, while non-CG methylation level is usually low and may be easily affected by other internal/external factors besides the DNA sequence.</p>
            <fig id="F5"><title><p>Figure 5</p></title><caption><p>Cluster analyses based on genome-wide cytosine methylation, SNPs and gene expression profiles of the four rice samples</p></caption><text>
   <p><b>Cluster analyses based on genome-wide cytosine methylation, SNPs and gene expression profiles of the four rice samples. (a)</b> Methylation tree for each sequence context. <b>(b)</b> Genomic tree based on SNPs. <b>(c)</b> Expression tree. Methylation and expression trees were constructed using the distances of correlation coefficients (<it>r</it>) of whole-genome methylation and expression profiles, respectively, among the samples. (<b>d</b>) Relationship between methylation level and their variation among species. The x-axis indicates the log<sub>2</sub> transformed methylation level of each sliding-window, and y-axis indicates the log<sub>2</sub> transformed CV of corresponding region among four samples.</p>
</text><graphic file="1471-2164-13-300-5"/></fig>
            <fig id="F6"><title><p>Figure 6</p></title><caption><p>Relationship between genetic and methylation divergence in each sequence contexts</p></caption><text>
   <p><b>Relationship between genetic and methylation divergence in each sequence contexts.</b> The average number of nucleotide differences per site (indicated by x-axis) and average Spearman correlation coefficients (<it>r</it>) of methylation level of all cytosines among samples (indicated by y-axis) were calculated for each 50-kb sliding window with a step of 25&#8201;kb across the whole genome. Then all sliding windows were classified into 20 groups with equal numbers (657 sliding windows) according to their <it>&#960;</it> values from the lowest to the highest. The average number of nucleotide differences per site and <it>r</it> of each group were calculated and their values were plotted. Because most sliding windows have relatively small values of average number of nucleotide differences per site, the data points in the figure were enriched in the left.</p>
</text><graphic file="1471-2164-13-300-6"/></fig>
            <p>However, the topology of the gene expression tree is different from both genomic DNA and methylation-based trees, with the two cultivated rice subspecies tightly clustering together and the two wild rice species being most similar to each other, a pattern consistent with the phenotypic relationships among the four samples. The genome-wide gene expression divergence of panicles among the four rice subspecies/species obviously departs from the expectation under the neutral evolution model that posits that gene expression differentiation positively correlates with species&#8217; genetic divergence <abbrgrp><abbr bid="B31">31</abbr></abbrgrp>. Instead, it suggests rice domestication may have occurred through changes in a limited number of genes that have pleiotropic and/or cascading effects on gene expression at the whole-genome level. With considerable gene expressional and phenotypic divergence between wild and cultivated rice, the panicle might have been an major target for artificial selection during domestication, a hypothesis consistent with the finding that many yield-related traits are associated with panicles <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>.</p>
            <p>The above results, i.e., the CHH methylation tree&#8217;s inconsistency with the genomic tree and the low correlation between non-CG methylation divergence and genetic divergence, imply that high-level methylation in CG context might be more conserved than low-level methylation in CHG and CHH contexts among species. To further test this hypothesis, we calculated the coefficient of variation (CV) using a sliding window of the methylation level for each of the CG, CHG and CHH context to measure their conservation levels among species. Our results show that CG methylation has the lowest variation (8.6%), followed by CHG (11.0%) and CHH (13.7%), consistent with the decrease of their methylation level in the same order. In addition, we calculated the correlation coefficient between methylation level and its CV among four samples in gene regions for each sequence context. We found that gene methylation level showed significant negative correlation with its CV regardless of sequence contexts (Figure <figr fid="F5">5</figr>d). These results suggested that high-level methylation states are more stable during evolution.</p>
            <p>To examine the methylation variation among species in different functional elements, we calculated the CVs of methylation level for mCs located in gene, promoter, TTR and TE regions (Additional file <supplr sid="S6">6</supplr>). We found that TEs&#8217; methylation status is most conserved among species with the smallest CV, followed by genes, promoters and TTRs, consistent with the previous observation in <it>Arabidopsis</it><abbrgrp><abbr bid="B32">32</abbr></abbrgrp>. The methylation conservation levels of different functional elements also follow their methylation levels, again suggesting that high-level methylation states are more stable among species. Further, we compared the methylation variations among different location and sequence contexts in the same methylation level groups. We found that mCs with similar methylation levels have similar variations regardless of their genomic location or sequence contexts (Additional file <supplr sid="S7">7</supplr>), demonstrating that methylation level is a consistent indicator of methylation variation among species.</p>
            <suppl id="S6">
               <title>
                  <p>Additional file 6</p>
               </title>
               <text>
                  <p>
                     <b>Coefficient of variation (CV) of methylation level for methylcytosine among species in different functional elements.</b>
                  </p>
               </text>
               <file name="1471-2164-13-300-S6.xls">
   <p>Click here for file</p>
</file>
            </suppl>
            <suppl id="S7">
               <title>
                  <p>Additional file 7</p>
               </title>
               <text>
                  <p><b>Coefficient of variation (CV) of methylation level for methylcytosine among species in different functional elements and sequence context in different methylation level groups.</b> (a) CG context (b) CHG context (c) CHH context.</p>
               </text>
               <file name="1471-2164-13-300-S7.pdf">
   <p>Click here for file</p>
</file>
            </suppl>
         </sec>
         <sec>
            <st>
               <p>Identification of differentially-methylated genes between cultivated rice and wild rice</p>
            </st>
            <p>To identify the DNA methylation changes that may be associated with rice domestication, we identified in cultivated rice 14/24/49 methylation-upregulated and 21/10/46 methylation-downregulated genes in promoter, TTR and gene body regions respectively, leading to a total of 155 non-redundant differentially-methylated genes between cultivated and wild rice (Additional file <supplr sid="S8">8</supplr>). We also picked 6 promoter or TTR regions in total to validate such methylation differentiation between cultivated and wild rice using the traditional bisulfite sequencing method for single genes, and the results conform to those from our whole genome BS-Seq analyses (Additional files <supplr sid="S9">9</supplr><supplr sid="S10">10</supplr><supplr sid="S11">11</supplr><supplr sid="S12">12</supplr><supplr sid="S13">13</supplr>,and <supplr sid="S14">14</supplr>), indicating the reliability of our BS-Seq results. Among the 155 genes, 11 (7.1%) show methylation-correlated 2-fold gene expression changes, but the proportion of genes with such expressional changes among differentially methylated genes is not significantly different from the proportion of all genes showing 2-fold gene expression changes between cultivated and wild rice regardless whether there is DNA methylation difference. Interestingly, a similar conclusion has also been drawn among natural accessions of <it>Arabidopsis thaliana</it> in which only 6% of differentially methylated genes have significantly different expression levels between ecotypes, and the proportion of expression-altered genes is the same as that among all genes <abbrgrp><abbr bid="B32">32</abbr></abbrgrp>. The results from both rice and <it>Arabidopsis</it> suggest that a variety of mechanisms, including genetic changes in genes&#8217; <it>cis</it>- or <it>trans-</it>regulators and chromatin modification, together with DNA methylation, regulate gene expression at the genomic level. However, it is also possible that subtle (less than two-fold) changes in gene expression caused by DNA methylation differences could have important consequences, particularly if those genes are of major or multiple effects. In the case of rice domestication, therefore, it still cannot be ruled out that a few key genes&#8217; epigenetic and correlated expressional changes might have played important roles in the production of some important agronomic traits in cultivated rice <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>. Given the small sample size in this study, methylomic and transcriptomic analysis of more representative wild and cultivated rice is needed to further clarify this important issue.</p>
            <suppl id="S8">
               <title>
                  <p>Additional file 8</p>
               </title>
               <text>
                  <p>
                     <b>List of differentially methylated genes between cultivated and wild rice.</b>
                  </p>
               </text>
               <file name="1471-2164-13-300-S8.xls">
   <p>Click here for file</p>
</file>
            </suppl>
            <suppl id="S9">
               <title>
                  <p>Additional file 9</p>
               </title>
               <text>
                  <p><b>Validation results for the promoter region of Os12g0264800 gene using the traditional bisulfite sequencing method.</b>In each panel, the top histogram shows the validation results from traditional bisulfite sequencing and the bottom shows the BS-Seq results. Methylation level of individual cytosine sites located on the genome (indicated on the x-axis) is shown on the y-axis. (a) CG context. (b) CHG context. (c) CHH context.</p>
               </text>
               <file name="1471-2164-13-300-S9.pdf">
   <p>Click here for file</p>
</file>
            </suppl>
            <suppl id="S10">
               <title>
                  <p>Additional file 10</p>
               </title>
               <text>
                  <p><b>Validation results of TTR region of Os11g0111101 gene by traditional bisulfite sequencing.</b> In each panel, the top histogram shows the validation results from traditional bisulfite sequencing and the bottom shows the BS-Seq results. Methylation level of individual cytosine sites located on the genome (indicated on the x-axis) is shown on the y-axis. (a) CG context. (b) CHG context. (c) CHH context.</p>
               </text>
               <file name="1471-2164-13-300-S10.pdf">
   <p>Click here for file</p>
</file>
            </suppl>
            <suppl id="S11">
               <title>
                  <p>Additional file 11</p>
               </title>
               <text>
                  <p><b>Validation results of promoter region of Os01g0116800 gene by traditional bisulfite sequencing. </b>In each panel, the top histogram shows the validation results from traditional bisulfite sequencing and the bottom shows the BS-Seq results. Methylation level of individual cytosine sites located on the genome (indicated on the x-axis) is shown on the y-axis. (a) CG context. (b) CHG context. (c) CHH context.</p>
               </text>
               <file name="1471-2164-13-300-S11.pdf">
   <p>Click here for file</p>
</file>
            </suppl>
            <suppl id="S12">
               <title>
                  <p>Additional file 12</p>
               </title>
               <text>
                  <p><b>Validation results of promoter region of Os01g0543000 gene by traditional bisulfite sequencing.</b> In each panel, the top histogram shows the validation results from traditional bisulfite sequencing and the bottom shows the BS-Seq results. Methylation level of individual cytosine sites located on the genome (indicated on the x-axis) is shown on the y-axis. (a) CG context. (b) CHG context. (c) CHH context.</p>
               </text>
               <file name="1471-2164-13-300-S12.pdf">
   <p>Click here for file</p>
</file>
            </suppl>
            <suppl id="S13">
               <title>
                  <p>Additional file 13</p>
               </title>
               <text>
                  <p><b>Validation results of promoter region of Os04g0431700 gene by traditional bisulfite sequencing.</b> In each panel, the top histogram shows the validation results from traditional bisulfite sequencing and the bottom shows the BS-Seq results. Methylation level of individual cytosine sites located on the genome (indicated on the x-axis) is shown on the y-axis. (a) CG context. (b) CHG context. (c) CHH context.</p>
               </text>
               <file name="1471-2164-13-300-S13.pdf">
   <p>Click here for file</p>
</file>
            </suppl>
            <suppl id="S14">
               <title>
                  <p>Additional file 14</p>
               </title>
               <text>
                  <p><b>Validation results of TTR region of Os08g0150200 gene by traditional bisulfite sequencing.</b> In each panel, the top histogram shows the validation results from traditional bisulfite sequencing and the bottom shows the BS-Seq results. Methylation level of individual cytosine sites located on the genome (indicated on the x-axis) is shown on the y-axis. (a) CG context. (b) CHG context. (c) CHH context.</p>
               </text>
               <file name="1471-2164-13-300-S14.pdf">
   <p>Click here for file</p>
</file>
            </suppl>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusions</p>
         </st>
         <p>The high resolution DNA methylation maps for the two cultivated rice subspecies and their wild ancestors obtained in this study and the integrated analysis of genomic, epigenomic, and transcriptomic data have not only broadened our understanding of the mechanisms of gene regulation and the complicated relationships between DNA divergence, DNA methylation, and gene expression variation in plant genomes, but also provided valuable data for future studies on rice epigenetics as well as on epigenetic differentiation between wild and cultivated rice.</p>
      </sec>
      <sec>
         <st>
            <p>Methods</p>
         </st>
         <sec>
            <st>
               <p>BS-Seq libraries construction and sequencing</p>
            </st>
            <p>To make our methylomes from four samples comparable, we carefully collected all samples at the same developmental stage of panicle initiation to booting. This stage is an important time point, at which rice start transitioning from vegetative growth to reproductive growth.</p>
            <p>A single young panicle from each of the cultivated rice subspecies and the two wild rice species was ground in liquid nitrogen to fine powder using mortar and pestle. Genomic DNAs were isolated using the Plant Genomic DNA Purification Kit (Tiangen Inc., China) and total RNAs were isolated using the RNeasy Plant Mini Kit (Qiagen Inc., Germany). DNA was fragmented by sonication with the Diagenome sonicator to a mean size of approximately 250&#8201;bp, followed by blunting, 3&#8217;-end addition of dA, and adaptor ligation according to the manufacturer&#8217;s instruction (Illumina). The bisulfite conversion of rice DNA was carried out using a modified (NH<sub>4</sub>)HSO<sub>3</sub>-based protocol <abbrgrp><abbr bid="B33">33</abbr></abbrgrp>. Bisulfite-treated DNAs were PCR amplified with 16 cycles. The resultant DNAs were applied to paired-end sequencing with the read length of 44 or 75 nt for each end using the ultrahigh-throughput Illumina Genetic Analyzer (GA 2) as per the manufacturer&#8217;s instructions.</p>
         </sec>
         <sec>
            <st>
               <p>Mapping and processing of BS-Seq reads</p>
            </st>
            <p>Because <it>japonica</it> rice has high quality reference genome sequence and gene annotation information, all reads from four rice samples were mapped to the Nipponbare IRGSP genome sequence (build 4 assembly), which was downloaded from RAP-DB (<url>http://rapdblegacy.dna.affrc.go.jp/archive/build4/OsGenome_RAP2.tar.gz</url>). Since DNA methylation has strand specificity, the plus strand and the minus strand of Nipponbare genome should be separated and used as different alignment target sequences for BS-Seq reads. That is, each cytosine in reference genome sequences was converted to thymine, termed T-genome which represents the plus strand. Meanwhile, each guanine in reference genome sequences was converted to adenosine, termed A-genome which represents the minus strand. To map the raw 44 or 75 nt pair-ended BS-Seq reads, the original reads were computationally converted to the alignment forms with the following steps: 1) observed cytosines on the forward read of each read pair were <it>in silico</it> replaced by thymines; 2) observed guanines on the reverse read of each read pair were <it>in silico</it> replaced by adenosines. The converted reads were then mapped to both strands of the A- and T- genome sequence using SOAP2 allowing up to two mismatches for 44 nt reads and four mismatches for 75 nt reads <abbrgrp><abbr bid="B34">34</abbr></abbrgrp>. Reads mapped to the same start position for both ends were regarded as clonal duplicates, which might have been generated during PCR process, and only one of them was kept. Only reads uniquely mapped to either of the strands were then retained for further analysis. After above filtration, for methylcytosine (mC) detection, we transformed each aligned read and the two strands of the Nipponbare genome back to their original forms to build an alignment between the original forms. Cytosines in the BS-Seq reads matching the corresponding cytosines in the plus strand of the reference genome, or guanines in the BS-Seq reads matching the corresponding guanines in the minus strand of the reference genome will be regarded as potential mCs. To exclude the false positive caused by base calling process, we removed those potential mCs with Q scores lower than 20, which means that a base is correctly called at more than 99% probability, a highly conservative criterion for calling reliable bases.</p>
            <p>We used the unmethylated chloroplast genome <abbrgrp><abbr bid="B21">21</abbr></abbrgrp> to calculate the sum of non-conversion rate and T-C sequencing error rate, and then conducted binomial tests using these values with false positive rate below 5% to exclude those mCs that may be the results of non-conversion of cytosines during our bisulfite treatment or T to C sequencing errors during base calling process.</p>
            <p>The method of mapping BS-seq reads has been successfully applied in profiling the silk gland methylome of silkworm and the peripheral blood mononuclear cell methylome of humans <abbrgrp><abbr bid="B15">15</abbr><abbr bid="B35">35</abbr></abbrgrp>. In these published studies as well as in this study, experimental validation confirmed the reliability of mC calling. To further compare the performance between our pipeline and other reported softwares, we chose data from one lane of <it>japonica</it> sample (17,406,765 paired reads) and the plus strand of chromosome01 to call mCs using both our method and Bismark <abbrgrp><abbr bid="B36">36</abbr></abbrgrp> with the same parameters (because BS seeker <abbrgrp><abbr bid="B37">37</abbr></abbrgrp> does not support paired-end reads, we could not use BS seeker to do the comparison). The results showed that in general the two methods gave very similar results. For example, 92%, 91% and 95% mCs for CG, CHG and CHH sequence context called by Bismark were also identified by our method. And the methylation levels obtained using two methods show high correlation for each sequence context (see Table <tblr tid="T4">4</tblr> for details). Furthermore, our method shows slightly higher sensitivity than Bismark, which could be caused by employing different short reads aligners (our method used SOAP, while Bismark used Bowtie). Therefore, we used mCs called with our pipeline to conduct all following analyses.</p>
            <table id="T4">
               <title>
                  <p>Table 4</p>
               </title>
               <caption>
                  <p>
                     <b>Comparison of mC calling between our pipeline and Bismark</b>
                  </p>
               </caption>
               <tgroup align="left" cols="4">
                  <colspec align="left" colname="c1" colnum="1" colwidth="1*"/>
                  <colspec align="left" colname="c2" colnum="2" colwidth="1*"/>
                  <colspec align="left" colname="c3" colnum="3" colwidth="1*"/>
                  <colspec align="left" colname="c4" colnum="4" colwidth="1*"/>
                  <thead valign="top">
                     <row rowsep="1">
                        <entry colname="c1"/>
                        <entry colname="c2">
                           <p>
                              <b>Called by both</b>
                           </p>
                        </entry>
                        <entry colname="c3">
                           <p>
                              <b>Called only by Bismark</b>
                           </p>
                        </entry>
                        <entry colname="c4">
                           <p>
                              <b>Called only by our method</b>
                           </p>
                        </entry>
                     </row>
                  </thead>
                  <tbody valign="top">
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>CG</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>414,168</p>
                        </entry>
                        <entry colname="c3">
                           <p>31,180</p>
                        </entry>
                        <entry colname="c4">
                           <p>43,897</p>
                        </entry>
                     </row>
                     <row>
                        <entry colname="c1">
                           <p>
                              <b>CHG</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>217,820</p>
                        </entry>
                        <entry colname="c3">
                           <p>20,356</p>
                        </entry>
                        <entry colname="c4">
                           <p>31,183</p>
                        </entry>
                     </row>
                     <row rowsep="1">
                        <entry colname="c1">
                           <p>
                              <b>CHH</b>
                           </p>
                        </entry>
                        <entry colname="c2">
                           <p>282,825</p>
                        </entry>
                        <entry colname="c3">
                           <p>16,525</p>
                        </entry>
                        <entry colname="c4">
                           <p>33,705</p>
                        </entry>
                     </row>
                  </tbody>
               </tgroup>
            </table>
         </sec>
         <sec>
            <st>
               <p>SNPs calling using BS-Seq reads</p>
            </st>
            <p>Because DNA methylation has strand specificity, BS-Seq reads mapped to T-genome contain the DNA sequence information of plus strand, while reads mapped to A-genome contain the information of minus strand. Thus we could use BS-Seq reads to call SNPs directly for both plus and minus strands for each sample. After mapping and processing of BS-Seq reads described in above step, SNPs in both strands were called using Samtools <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. To get high-quality SNPs, we used strict standards for our results&#8212;only bases with base quality (Q score) of at least 30 and positions covered by at least 5 reads were used for our SNP calling process. Although bisulfite treatment will convert C to T in both strands which will affect judgment of some kinds of genotypes during SNPs calling process, we can use SNP information from both strands to solve this problem. Some genotypes (A/G, G/A, C/A, C/G, T/A, T/G, A/A, G/G, the former indicates reference base and latter indicates sample&#8217;s base) can be correctly called using results from plus strand, while the other genotypes (A/C, A/T, G/T, G/C, C/T, T/C, T/T, C/C) can be correctly called using results from minus strand. Under this principle, a total of 37,141, 50,340, 65,680, and 83,594 high-quality SNPs in <it>japonica</it><it>indica</it><it>O. rufipogon</it>, and <it>O. nivara</it> were obtained respectively and used for further analysis.</p>
         </sec>
         <sec>
            <st>
               <p>Validation of BS-Seq results</p>
            </st>
            <p>To verify the BS-Seq results, we picked 6 regions, including 4 promoter regions (Os12g0264800, Os01g0116800, Os01g0543000, and Os04g0431700 genes) and 2 TTR regions (Os11g0111101 and Os08g0150200 genes), to validate the methylation status in all the four samples using the traditional bisulfite sequencing method for single genes.</p>
         </sec>
         <sec>
            <st>
               <p>Digital Gene Expression (DGE) tag libraries construction</p>
            </st>
            <p>DGE-tag libraries were constructed from the total RNAs isolated from the same four rice panicles used for extracting DNA with the DGE-Tag Profiling NlaIII Sample Prep Kit (Illumina) according to the manufacturer&#8217;s instructions.</p>
         </sec>
         <sec>
            <st>
               <p>Mapping and processing of Digital Gene Expression (DGE) tags</p>
            </st>
            <p>Full-length cDNA sequences of rice genes were downloaded from RAP-DB (<url>http://rapdblegacy.dna.affrc.go.jp/archive/build4/rep_RAP2.tar.gz</url>). A total of 24,955 genes supported with full length cDNA were used for DGE analysis. All possible CATG&#8201;+&#8201;17nt tag sequences were created from 24,955 full-length cDNAs and used as the reference tag database. Unique tag sequences and their numbers were extracted from our raw DGE tags and these tags were aligned against the reference tag database using SOAP <abbrgrp><abbr bid="B39">39</abbr></abbrgrp>. Only perfect matches were kept for further analysis. Within genes, most of the DGE tags were mapped to the most 3&#8217;-end CATG sites of genes (Additional file <supplr sid="S15">15</supplr>), suggesting that transcriptional termination sites of most rice genes we used were annotated correctly and that performing DGE analysis for those genes was suitable and reliable. The expression level of a gene was represented by the total number of tags that uniquely aligned to that gene. Gene expression levels were normalized to tag number per million tags for gene expression comparisons among different samples.</p>
            <suppl id="S15">
               <title>
                  <p>Additional file 15</p>
               </title>
               <text>
                  <p><b>Distribution of DGE tags across CATG sites within genes and gene numbers supported by DGE tags from different CATG sites.</b> (a) japonica. (b) indica. (c) O. rufipogon. (d) O. nivara. For each panel, x-axis indicates CATG site positions from 3&#8217;-end of genes, while y-axis in left indicates the corresponding numbers of total tags mapped to different CATG positions and y-axis in right indicates the corresponding gene numbers supported by DGE tags mapped to different CATG sites.</p>
               </text>
               <file name="1471-2164-13-300-S15.pdf">
   <p>Click here for file</p>
</file>
            </suppl>
         </sec>
         <sec>
            <st>
               <p>Methylation level, TE and smRNA density analyses</p>
            </st>
            <p>Annotation of TEs was downloaded from RAP-DB (<url>http://rapdblegacy.dna.affrc.go.jp/archive/build4/OsNIAS_b4_chromOut.tar.gz</url>) and smRNA sequences were downloaded from rice MPSS database (<url>http://mpss.udel.edu/data-files/rice/small/smallRNA_summary.txt</url>). Sequences of smRNAs were mapped to the rice reference genome using SOAP <abbrgrp><abbr bid="B39">39</abbr></abbrgrp> without allowing mismatch, and uniquely mapped smRNAs were used for further analysis. Methylation level refers to the proportion of reads showing mC among all reads covering the same cytosine site. It can further be classified as absolute methylation level (total methylation level of mCs divided by the total sequence length of the calculated region) and relative methylation level (total methylation level of mCs divided by total number of cytosine sites in the calculated region), both of which were used for our analysis. TE or smRNA density was defined as the ratio of the number of bases belonging to TEs or smRNAs to the total length of the calculated region.</p>
         </sec>
         <sec>
            <st>
               <p>Methylation-expression correlation analysis for <it>Arabidopsis</it></p>
            </st>
            <p>The single-base methylation profile and corresponding gene expression profile of <it>Arabidopsis</it> were downloaded from NCBI SRA (Sequence Read Archive) database (<url>http://www.ncbi.nlm.nih.gov/sra</url>, the accession numbers are SRA000284 for BS-Seq, also referred as MethylC-Seq in Lister <it>et. al.</it>&#8217;s paper <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>, and SRA000286 for mRNA-seq). The genome sequences and gene annotation information (TAIR9) were downloaded from the ftp site of TAIR (The <it>Arabidopsis</it> Information Resource, <url>ftp://ftp.arabidopsis.org/home/tair/</url>). The method of mapping and processing of BS-Seq reads is the same as that used in rice. Mapping and processing of mRNA-seq reads were conducted using TopHat software <abbrgrp><abbr bid="B40">40</abbr></abbrgrp>. Gene expression levels, measured by reads per kilobase of transcript per million reads (RPKM), was also calculated using TopHat. Methylation-expression correlation analyses for <it>Arabidopsis</it> were performed with the same methods as used for rice.</p>
         </sec>
         <sec>
            <st>
               <p>Construction of methylation, genomic and expression trees</p>
            </st>
            <p>For methylation tree construction, we first calculated the absolute methylation level in sliding windows of 50&#8201;kb with steps of 25&#8201;kb across the whole genome for the four samples, and then clustered the samples based on pairwise Spearman correlation coefficients estimated from the above whole genome sliding methylation level matrix. Methylation levels of all mCs with&#8201;&#8805;&#8201;5&#8201;&#215;&#8201;coverage of the whole genome were also used to calculate the pairwise Spearman correlation coefficients among samples, which in turn produced similar methylation tree. High-quality SNPs called from BS-Seq reads were used to construct genomic tree among the four samples using <it>p</it> distance and neighbor-joining method implemented in MEGA <abbrgrp><abbr bid="B41">41</abbr><abbr bid="B42">42</abbr></abbrgrp>. Finally, an expression tree was constructed using pairwise Spearman expression correlation coefficients among the four samples based on DGE data. Methylation and expression trees were constructed using the hclust function of R statistical software (<url>http://www.r-project.org/</url>).</p>
         </sec>
         <sec>
            <st>
               <p>Examination of the relationship between genetic divergence and methylation divergence</p>
            </st>
            <p>To examine the relationship between genetic and methylation divergence, the average number of nucleotide differences per site among samples for different genomic regions was calculated using SNPs obtained from the above step with 50&#8201;kb sliding window and a step of 25&#8201;kb through the whole genome, which was used to measure genetic divergence. Then average Spearman correlation coefficients of methylation level of all cytosines with&#8201;&#8805;&#8201;5&#8201;&#215;&#8201;coverage among samples were calculated for same sliding windows and used to measure methylation divergence in different genomic regions.</p>
         </sec>
         <sec>
            <st>
               <p>Identification of differentially methylated genes between cultivated and wild rice</p>
            </st>
            <p>Because mCs in promoters, TTRs and gene bodies have significant effects on gene expression, we identified genes with different methylation status in these three regions among the four rice samples. Only regions with above 80% sequencing coverage were used for further analysis. Methylation levels of all Cs within promoters/TTRs/gene-bodies were calculated and used to perform two-sample Wilcoxon rank sum tests between any samples. Differentially-methylated genes were identified for each pairwise comparison using a significance level of <it>alpha</it>&#8201;&lt;&#8201;0.05. Genes that are significantly methylation-upregulated or methylation-downregulated consistently in all cultivated vs. wild rice pairwise comparisons but are not significantly different within cultivated or wild rice comparisons were respectively identified as methylation-upregulated or methylation-downregulated genes between cultivated and wild rice.</p>
         </sec>
         <sec>
            <st>
               <p>Accession codes</p>
            </st>
            <p>The methylome data have been deposited into the NCBI Short Read Archive (SRA, <url>http://www.ncbi.nlm.nih.gov/sra/</url>) under accession number SRA012190 and DGE data have been deposited into the NCBI Gene Expression Omnibus (GEO, <url>http://www.ncbi.nlm.nih.gov/geo</url>) under accession number GSE20871.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Abbreviations</p>
         </st>
         <p>TTRs, transcriptional termination regions; BS-Seq, bisulfite-treated genomic DNA sequencing; mC, methylated cytosine; TEs, transposable elements; DGE, Digital Gene Expression tag profiling; SAGE, Serial Analysis of Gene Expression; FL-cDNAs, nonredundant full-length cDNAs; CV, coefficient of variation.</p>
      </sec>
      <sec>
         <st>
            <p>Competing interests</p>
         </st>
         <p>The authors declare that they have no competing interests.</p>
      </sec>
      <sec>
         <st>
            <p>Authors&#8217; contributions</p>
         </st>
         <p>WW, JW, JZ and SG designed the study. XL, WW, HX, XX, XC and JW wrote the manuscript. FH, XZ, SG, SZ and QL collected the samples. JZ, JY, XZ and HX constructed the BS-Seq libraries and conducted the BS validation. MY, GZ, RL, CY performed the Illumina sequencing. XL, HX, FH, and XX performed the data analyses. All authors read and approved the final manuscript.</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgments</p>
            </st>
            <p>We are grateful to Keyan Zhao, Haiyi Wang, Eric Richards, and Peter Lipke for their helpful discussions and comments on the work, and to the International Rice Research Institute (Los Banos, Philippines) for providing the seed samples of the two wild rice species. This work was supported by the Chinese 973 program (2007CB815700, 2005CB121000, 2009CB825606 and 2009CB825607), the Provincial Key Grant of Yunnan Province (2008CC017; 2008GA002), the National Natural Science Foundation of China (U0836605, 30921140312 and 30872963), the Shenzhen Municipal Government and the Yantian District local government of Shenzhen, the Ole R&#248;mer grant from the Danish Natural Science Research Council, a CAS-Max Planck Society Fellowship, the 100 talent program of CAS, a Shanghai Science Foundation grant (07DJ14074), and a European 6th program grant (LSHB-CT-2005-019067) to WW, JW, SG or JZ.</p>
         </sec>
      </ack>
      <refgrp><bibl id="B1"><title><p>DNA methylation landscapes: provocative insights from epigenomics</p></title><aug><au><snm>Suzuki</snm><fnm>MM</fnm></au><au><snm>Bird</snm><fnm>A</fnm></au></aug><source>Nat Rev Genet</source><pubdate>2008</pubdate><volume>9</volume><fpage>465</fpage><lpage>476</lpage><xrefbib><pubid idtype="pmpid" link="fulltext">18463664</pubid></xrefbib></bibl><bibl id="B2"><title><p>Inherited epigenetic variation &#8211; revisiting soft inheritance</p></title><aug><au><snm>Richards</snm><fnm>EJ</fnm></au></aug><source>Nat Rev Genet</source><pubdate>2006</pubdate><volume>7</volume><fpage>395</fpage><lpage>401</lpage><xrefbib><pubid idtype="pmpid" link="fulltext">16534512</pubid></xrefbib></bibl><bibl id="B3"><title><p>Epialleles via DNA methylation: consequences for plant evolution</p></title><aug><au><snm>Kalisz</snm><fnm>S</fnm></au><au><snm>Purugganan</snm><fnm>MD</fnm></au></aug><source>Trends in Ecol Evol</source><pubdate>2004</pubdate><volume>19</volume><fpage>309</fpage><lpage>314</lpage><xrefbib><pubid idtype="doi">10.1016/j.tree.2004.03.034</pubid></xrefbib></bibl><bibl id="B4"><title><p>A naturally occurring epigenetic mutation in a gene encoding an SBP-box transcription factor inhibits tomato fruit ripening</p></title><aug><au><snm>Manning</snm><fnm>K</fnm></au><au><snm>Tor</snm><fnm>M</fnm></au><au><snm>Poole</snm><fnm>M</fnm></au><au><snm>Hong</snm><fnm>Y</fnm></au><au><snm>Thompson</snm><fnm>AJ</fnm></au><au><snm>King</snm><fnm>GJ</fnm></au><au><snm>Giovannoni</snm><fnm>JJ</fnm></au><au><snm>Seymour</snm><fnm>GB</fnm></au></aug><source>Nat Genet</source><pubdate>2006</pubdate><volume>38</volume><fpage>948</fpage><lpage>952</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/ng1841</pubid><pubid idtype="pmpid" link="fulltext">16832354</pubid></pubidlist></xrefbib></bibl><bibl id="B5"><title><p>An epigenetic mutation responsible for natural variation in floral symmetry</p></title><aug><au><snm>Cubas</snm><fnm>P</fnm></au><au><snm>Vincent</snm><fnm>C</fnm></au><au><snm>Coen</snm><fnm>E</fnm></au></aug><source>Nature</source><pubdate>1999</pubdate><volume>401</volume><fpage>157</fpage><lpage>161</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/43657</pubid><pubid idtype="pmpid" link="fulltext">10490023</pubid></pubidlist></xrefbib></bibl><bibl id="B6"><title><p>Hypermethylated SUPERMAN epigenetic alleles in Arabidopsis</p></title><aug><au><snm>Jacobsen</snm><fnm>SE</fnm></au><au><snm>Meyerowitz</snm><fnm>EM</fnm></au></aug><source>Science</source><pubdate>1997</pubdate><volume>277</volume><fpage>1100</fpage><lpage>1103</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.277.5329.1100</pubid><pubid idtype="pmpid" link="fulltext">9262479</pubid></pubidlist></xrefbib></bibl><bibl id="B7"><title><p>Epigenetic inheritance at the agouti locus in the mouse</p></title><aug><au><snm>Morgan</snm><fnm>HD</fnm></au><au><snm>Sutherland</snm><fnm>HGE</fnm></au><au><snm>Martin</snm><fnm>DIK</fnm></au><au><snm>Whitelaw</snm><fnm>E</fnm></au></aug><source>Nat Genet</source><pubdate>1999</pubdate><volume>23</volume><fpage>314</fpage><lpage>318</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/15490</pubid><pubid idtype="pmpid" link="fulltext">10545949</pubid></pubidlist></xrefbib></bibl><bibl id="B8"><title><p>The late flowering phenotype of fwa mutants is caused by gain-of-function epigenetic alleles of a homeodomain gene</p></title><aug><au><snm>Soppe</snm><fnm>WJJ</fnm></au><au><snm>Jacobsen</snm><fnm>SE</fnm></au><au><snm>Alonso-Blanco</snm><fnm>C</fnm></au><au><snm>Jackson</snm><fnm>JP</fnm></au><au><snm>Kakutani</snm><fnm>T</fnm></au><au><snm>Koornneef</snm><fnm>M</fnm></au><au><snm>Peeters</snm><fnm>AJM</fnm></au></aug><source>Mol Cell</source><pubdate>2000</pubdate><volume>6</volume><fpage>791</fpage><lpage>802</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/S1097-2765(05)00090-0</pubid><pubid idtype="pmpid" link="fulltext">11090618</pubid></pubidlist></xrefbib></bibl><bibl id="B9"><title><p>Meiotically stable natural epialleles of Sadhu, a novel Arabidopsis retroposon</p></title><aug><au><snm>Rangwala</snm><fnm>SH</fnm></au><au><snm>Elumalai</snm><fnm>R</fnm></au><au><snm>Vanier</snm><fnm>C</fnm></au><au><snm>Ozkan</snm><fnm>H</fnm></au><au><snm>Galbraith</snm><fnm>DW</fnm></au><au><snm>Richards</snm><fnm>EJ</fnm></au></aug><source>PLoS Genet</source><pubdate>2006</pubdate><volume>2</volume><fpage>e36</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1371/journal.pgen.0020036</pubid><pubid idtype="pmcid">1401498</pubid><pubid idtype="pmpid" link="fulltext">16552445</pubid></pubidlist></xrefbib></bibl><bibl id="B10"><title><p>Metastable epialleles in mammals</p></title><aug><au><snm>Rakyan</snm><fnm>VK</fnm></au><au><snm>Blewitt</snm><fnm>ME</fnm></au><au><snm>Druker</snm><fnm>R</fnm></au><au><snm>Preis</snm><fnm>JI</fnm></au><au><snm>Whitelaw</snm><fnm>E</fnm></au></aug><source>Trends in Genet</source><pubdate>2002</pubdate><volume>18</volume><fpage>348</fpage><lpage>351</lpage><xrefbib><pubid idtype="doi">10.1016/S0168-9525(02)02709-9</pubid></xrefbib></bibl><bibl id="B11"><title><p>A metastable DWARF1 epigenetic mutant affecting plant stature in rice</p></title><aug><au><snm>Miura</snm><fnm>K</fnm></au><au><snm>Agetsuma</snm><fnm>M</fnm></au><au><snm>Kitano</snm><fnm>H</fnm></au><au><snm>Yoshimura</snm><fnm>A</fnm></au><au><snm>Matsuoka</snm><fnm>M</fnm></au><au><snm>Jacobsen</snm><fnm>SE</fnm></au><au><snm>Ashikari</snm><fnm>M</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2009</pubdate><volume>106</volume><fpage>11218</fpage><lpage>11223</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0901942106</pubid><pubid idtype="pmcid">2708680</pubid><pubid idtype="pmpid" link="fulltext">19541604</pubid></pubidlist></xrefbib></bibl><bibl id="B12"><title><p>Shotgun bisulphite sequencing of the Arabidopsis genome reveals DNA methylation patterning</p></title><aug><au><snm>Cokus</snm><fnm>SJ</fnm></au><au><snm>Feng</snm><fnm>S</fnm></au><au><snm>Zhang</snm><fnm>X</fnm></au><au><snm>Chen</snm><fnm>Z</fnm></au><au><snm>Merriman</snm><fnm>B</fnm></au><au><snm>Haudenschild</snm><fnm>CD</fnm></au><au><snm>Pradhan</snm><fnm>S</fnm></au><au><snm>Nelson</snm><fnm>SF</fnm></au><au><snm>Pellegrini</snm><fnm>M</fnm></au><au><snm>Jacobsen</snm><fnm>SE</fnm></au></aug><source>Nature</source><pubdate>2008</pubdate><volume>452</volume><fpage>215</fpage><lpage>219</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nature06745</pubid><pubid idtype="pmcid">2377394</pubid><pubid idtype="pmpid" link="fulltext">18278030</pubid></pubidlist></xrefbib></bibl><bibl id="B13"><title><p>Highly integrated single-base resolution maps of the epigenome in Arabidopsis</p></title><aug><au><snm>Lister</snm><fnm>R</fnm></au><au><snm>O&apos;Malley</snm><fnm>RC</fnm></au><au><snm>Tonti-Filippini</snm><fnm>J</fnm></au><au><snm>Gregory</snm><fnm>BD</fnm></au><au><snm>Berry</snm><fnm>CC</fnm></au><au><snm>Millar</snm><fnm>AH</fnm></au><au><snm>Ecker</snm><fnm>JR</fnm></au></aug><source>Cell</source><pubdate>2008</pubdate><volume>133</volume><fpage>523</fpage><lpage>536</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/j.cell.2008.03.029</pubid><pubid idtype="pmcid">2723732</pubid><pubid idtype="pmpid" link="fulltext">18423832</pubid></pubidlist></xrefbib></bibl><bibl id="B14"><title><p>Human DNA methylomes at base resolution show widespread epigenomic differences</p></title><aug><au><snm>Lister</snm><fnm>R</fnm></au><au><snm>Pelizzola</snm><fnm>M</fnm></au><au><snm>Dowen</snm><fnm>RH</fnm></au><au><snm>Hawkins</snm><fnm>RD</fnm></au><au><snm>Hon</snm><fnm>G</fnm></au><au><snm>Tonti-Filippini</snm><fnm>J</fnm></au><au><snm>Nery</snm><fnm>JR</fnm></au><au><snm>Lee</snm><fnm>L</fnm></au><au><snm>Ye</snm><fnm>Z</fnm></au><au><snm>Ngo</snm><fnm>Q-M</fnm></au><etal/></aug><source>Nature</source><pubdate>2009</pubdate><volume>462</volume><fpage>315</fpage><lpage>322</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nature08514</pubid><pubid idtype="pmcid">2857523</pubid><pubid idtype="pmpid" link="fulltext">19829295</pubid></pubidlist></xrefbib></bibl><bibl id="B15"><title><p>Single base-resolution methylome of the silkworm reveals a sparse epigenomic map</p></title><aug><au><snm>Xiang</snm><fnm>H</fnm></au><au><snm>Zhu</snm><fnm>J</fnm></au><au><snm>Chen</snm><fnm>Q</fnm></au><au><snm>Dai</snm><fnm>F</fnm></au><au><snm>Li</snm><fnm>X</fnm></au><au><snm>Li</snm><fnm>M</fnm></au><au><snm>Zhang</snm><fnm>H</fnm></au><au><snm>Zhang</snm><fnm>G</fnm></au><au><snm>Li</snm><fnm>D</fnm></au><au><snm>Dong</snm><fnm>Y</fnm></au></aug><source>Nat Biotechnol</source><pubdate>2010</pubdate><volume>28</volume><fpage>516</fpage><lpage>520</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nbt.1626</pubid><pubid idtype="pmpid" link="fulltext">20436463</pubid></pubidlist></xrefbib></bibl><bibl id="B16"><title><p>High-resolution mapping of epigenetic modifications of the rice genome uncovers interplay between DNA methylation, histone methylation, and gene expression</p></title><aug><au><snm>Li</snm><fnm>X</fnm></au><au><snm>Wang</snm><fnm>X</fnm></au><au><snm>He</snm><fnm>K</fnm></au><au><snm>Ma</snm><fnm>Y</fnm></au><au><snm>Su</snm><fnm>N</fnm></au><au><snm>He</snm><fnm>H</fnm></au><au><snm>Stolc</snm><fnm>V</fnm></au><au><snm>Tongprasit</snm><fnm>W</fnm></au><au><snm>Jin</snm><fnm>W</fnm></au><au><snm>Jiang</snm><fnm>J</fnm></au><etal/></aug><source>Plant Cell</source><pubdate>2008</pubdate><volume>20</volume><fpage>259</fpage><lpage>276</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1105/tpc.107.056879</pubid><pubid idtype="pmcid">2276441</pubid><pubid idtype="pmpid" link="fulltext">18263775</pubid></pubidlist></xrefbib></bibl><bibl id="B17"><title><p>Global epigenetic and transcriptional trends among two rice subspecies and their reciprocal hybrids</p></title><aug><au><snm>He</snm><fnm>G</fnm></au><au><snm>Zhu</snm><fnm>X</fnm></au><au><snm>Elling</snm><fnm>AA</fnm></au><au><snm>Chen</snm><fnm>L</fnm></au><au><snm>Wang</snm><fnm>X</fnm></au><au><snm>Guo</snm><fnm>L</fnm></au><au><snm>Liang</snm><fnm>M</fnm></au><au><snm>He</snm><fnm>H</fnm></au><au><snm>Zhang</snm><fnm>H</fnm></au><au><snm>Chen</snm><fnm>F</fnm></au><etal/></aug><source>Plant Cell</source><pubdate>2010</pubdate><volume>22</volume><fpage>17</fpage><lpage>33</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1105/tpc.109.072041</pubid><pubid idtype="pmcid">2828707</pubid><pubid idtype="pmpid" link="fulltext">20086188</pubid></pubidlist></xrefbib></bibl><bibl id="B18"><title><p>Genome-wide evolutionary analysis of eukaryotic DNA methylation</p></title><aug><au><snm>Zemach</snm><fnm>A</fnm></au><au><snm>McDaniel</snm><fnm>IE</fnm></au><au><snm>Silva</snm><fnm>P</fnm></au><au><snm>Zilberman</snm><fnm>D</fnm></au></aug><source>Science</source><pubdate>2010</pubdate><volume>328</volume><fpage>916</fpage><lpage>919</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.1186366</pubid><pubid idtype="pmpid" link="fulltext">20395474</pubid></pubidlist></xrefbib></bibl><bibl id="B19"><title><p>Conservation and divergence of methylation patterning in plants and animals</p></title><aug><au><snm>Feng</snm><fnm>S</fnm></au><au><snm>Cokus</snm><fnm>SJ</fnm></au><au><snm>Zhang</snm><fnm>X</fnm></au><au><snm>Chen</snm><fnm>PY</fnm></au><au><snm>Bostick</snm><fnm>M</fnm></au><au><snm>Goll</snm><fnm>MG</fnm></au><au><snm>Hetzel</snm><fnm>J</fnm></au><au><snm>Jain</snm><fnm>J</fnm></au><au><snm>Strauss</snm><fnm>SH</fnm></au><au><snm>Halpern</snm><fnm>ME</fnm></au><etal/></aug><source>Proceedings of the National Academy of Sciences</source><pubdate>2010</pubdate><volume>107</volume><fpage>8689</fpage><lpage>8694</lpage><xrefbib><pubid idtype="doi">10.1073/pnas.1002720107</pubid></xrefbib></bibl><bibl id="B20"><aug><au><snm>Yoshida</snm><fnm>S</fnm></au></aug><source>Fundamentals of rice crop science</source><publisher>Laguna, Philippines: International Institute of Rice Research</publisher><pubdate>1981</pubdate></bibl><bibl id="B21"><title><p>Cytosine methylation of plastid genome in higher plants</p></title><aug><au><snm>Fojtova</snm><fnm>M</fnm></au><au><snm>Kovarik</snm><fnm>A</fnm></au><au><snm>Matyasek</snm><fnm>R</fnm></au></aug><source>Fact or artefact. Plant Sci</source><pubdate>2001</pubdate><volume>160</volume><fpage>585</fpage><lpage>593</lpage><xrefbib><pubid idtype="pmpid" link="fulltext">11448733</pubid></xrefbib></bibl><bibl id="B22"><title><p>DNA methylation profiling identifies CG methylation clusters in Arabidopsis genes</p></title><aug><au><snm>Tran</snm><fnm>RK</fnm></au><au><snm>Henikoff</snm><fnm>JG</fnm></au><au><snm>Zilberman</snm><fnm>D</fnm></au><au><snm>Ditt</snm><fnm>RF</fnm></au><au><snm>Jacobsen</snm><fnm>SE</fnm></au><au><snm>Henikoff</snm><fnm>S</fnm></au></aug><source>Curr Biol</source><pubdate>2005</pubdate><volume>15</volume><fpage>154</fpage><lpage>159</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/j.cub.2005.01.008</pubid><pubid idtype="pmpid" link="fulltext">15668172</pubid></pubidlist></xrefbib></bibl><bibl id="B23"><title><p>Cytogenetics for the model system Arabidopsis thaliana</p></title><aug><au><snm>Fransz</snm><fnm>P</fnm></au><au><snm>Armstrong</snm><fnm>S</fnm></au><au><snm>Alonsoblanco</snm><fnm>C</fnm></au><au><snm>Fischer</snm><fnm>TC</fnm></au><au><snm>Torresruiz</snm><fnm>RA</fnm></au><au><snm>Jones</snm><fnm>G</fnm></au></aug><source>Plant J</source><pubdate>1998</pubdate><volume>13</volume><fpage>867</fpage><lpage>876</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1046/j.1365-313X.1998.00086.x</pubid><pubid idtype="pmpid" link="fulltext">9681023</pubid></pubidlist></xrefbib></bibl><bibl id="B24"><title><p>Toward a cytological characterization of the rice genome</p></title><aug><au><snm>Cheng</snm><fnm>Z</fnm></au><au><snm>Buell</snm><fnm>CR</fnm></au><au><snm>Wing</snm><fnm>RA</fnm></au><au><snm>Gu</snm><fnm>M</fnm></au><au><snm>Jiang</snm><fnm>J</fnm></au></aug><source>Genome Res</source><pubdate>2001</pubdate><volume>11</volume><fpage>2133</fpage><lpage>2141</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1101/gr.194601</pubid><pubid idtype="pmcid">311230</pubid><pubid idtype="pmpid" link="fulltext">11731505</pubid></pubidlist></xrefbib></bibl><bibl id="B25"><title><p>Genome-wide high-resolution mapping and functional analysis of DNA methylation in Arabidopsis</p></title><aug><au><snm>Zhang</snm><fnm>X</fnm></au><au><snm>Yazaki</snm><fnm>J</fnm></au><au><snm>Sundaresan</snm><fnm>A</fnm></au><au><snm>Cokus</snm><fnm>S</fnm></au><au><snm>Chan</snm><fnm>SW</fnm></au><au><snm>Chen</snm><fnm>H</fnm></au><au><snm>Henderson</snm><fnm>IR</fnm></au><au><snm>Shinn</snm><fnm>P</fnm></au><au><snm>Pellegrini</snm><fnm>M</fnm></au><au><snm>Jacobsen</snm><fnm>SE</fnm></au><etal/></aug><source>Cell</source><pubdate>2006</pubdate><volume>126</volume><fpage>1189</fpage><lpage>1201</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1016/j.cell.2006.08.003</pubid><pubid idtype="pmpid" link="fulltext">16949657</pubid></pubidlist></xrefbib></bibl><bibl id="B26"><title><p>Dynamic changes in the human methylome during differentiation</p></title><aug><au><snm>Laurent</snm><fnm>L</fnm></au><au><snm>Wong</snm><fnm>E</fnm></au><au><snm>Li</snm><fnm>G</fnm></au><au><snm>Huynh</snm><fnm>T</fnm></au><au><snm>Tsirigos</snm><fnm>A</fnm></au><au><snm>Ong</snm><fnm>CT</fnm></au><au><snm>Low</snm><fnm>HM</fnm></au><au><snm>Kin Sung</snm><fnm>KW</fnm></au><au><snm>Rigoutsos</snm><fnm>I</fnm></au><au><snm>Loring</snm><fnm>J</fnm></au><etal/></aug><source>Genome Res</source><pubdate>2010</pubdate><volume>20</volume><fpage>320</fpage><lpage>331</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1101/gr.101907.109</pubid><pubid idtype="pmcid">2840979</pubid><pubid idtype="pmpid" link="fulltext">20133333</pubid></pubidlist></xrefbib></bibl><bibl id="B27"><title><p>Genome-wide analysis of Arabidopsis thaliana DNA methylation uncovers an interdependence between methylation and transcription</p></title><aug><au><snm>Zilberman</snm><fnm>D</fnm></au><au><snm>Gehring</snm><fnm>M</fnm></au><au><snm>Tran</snm><fnm>RK</fnm></au><au><snm>Ballinger</snm><fnm>T</fnm></au><au><snm>Henikoff</snm><fnm>S</fnm></au></aug><source>Nat Genet</source><pubdate>2007</pubdate><volume>39</volume><fpage>61</fpage><lpage>69</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/ng1929</pubid><pubid idtype="pmpid" link="fulltext">17128275</pubid></pubidlist></xrefbib></bibl><bibl id="B28"><title><p>Nonmethylated transposable elements and methylated genes in a chordate genome</p></title><aug><au><snm>Simmen</snm><fnm>MW</fnm></au><au><snm>Leitgeb</snm><fnm>S</fnm></au><au><snm>Charlton</snm><fnm>J</fnm></au><au><snm>Jones</snm><fnm>SJ</fnm></au><au><snm>nbsp</snm><fnm>M</fnm></au><au><snm>Harris</snm><fnm>BR</fnm></au><au><snm>Clark</snm><fnm>VH</fnm></au><au><snm>Bird</snm><fnm>A</fnm></au></aug><source>Science</source><pubdate>1999</pubdate><volume>283</volume><fpage>1164</fpage><lpage>1167</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.283.5405.1164</pubid><pubid idtype="pmpid" link="fulltext">10024242</pubid></pubidlist></xrefbib></bibl><bibl id="B29"><title><p>DNA demethylation in the Arabidopsis genome</p></title><aug><au><snm>Penterman</snm><fnm>J</fnm></au><au><snm>Zilberman</snm><fnm>D</fnm></au><au><snm>Huh</snm><fnm>JH</fnm></au><au><snm>Ballinger</snm><fnm>T</fnm></au><au><snm>Henikoff</snm><fnm>S</fnm></au><au><snm>Fischer</snm><fnm>RL</fnm></au></aug><source>Proc Natl Acad Sci USA</source><pubdate>2007</pubdate><volume>104</volume><fpage>6752</fpage><lpage>6757</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.0701861104</pubid><pubid idtype="pmcid">1847597</pubid><pubid idtype="pmpid" link="fulltext">17409185</pubid></pubidlist></xrefbib></bibl><bibl id="B30"><title><p>Extensive demethylation of repetitive elements during seed development underlies gene imprinting</p></title><aug><au><snm>Gehring</snm><fnm>M</fnm></au><au><snm>Bubb</snm><fnm>KL</fnm></au><au><snm>Henikoff</snm><fnm>S</fnm></au></aug><source>Science</source><pubdate>2009</pubdate><volume>324</volume><fpage>1447</fpage><lpage>1451</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.1171609</pubid><pubid idtype="pmcid">2886585</pubid><pubid idtype="pmpid" link="fulltext">19520961</pubid></pubidlist></xrefbib></bibl><bibl id="B31"><title><p>Variation within and among species in gene expression: raw material for evolution</p></title><aug><au><snm>Andrew</snm><fnm>W</fnm></au><au><snm>Douglas</snm><fnm>LC</fnm></au></aug><source>Mol Ecol</source><pubdate>2006</pubdate><volume>15</volume><fpage>1197</fpage><lpage>1211</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1111/j.1365-294X.2006.02868.x</pubid><pubid idtype="pmpid" link="fulltext">16626448</pubid></pubidlist></xrefbib></bibl><bibl id="B32"><title><p>Epigenetic natural variation in Arabidopsis thaliana</p></title><aug><au><snm>Vaughn</snm><fnm>MW</fnm></au><au><snm>Tanurd</snm><fnm>MI</fnm></au><au><snm>Lippman</snm><fnm>Z</fnm></au><au><snm>Jiang</snm><fnm>H</fnm></au><au><snm>Carrasquillo</snm><fnm>R</fnm></au><au><snm>Rabinowicz</snm><fnm>PD</fnm></au><au><snm>Dedhia</snm><fnm>N</fnm></au><au><snm>McCombie</snm><fnm>WR</fnm></au><au><snm>Agier</snm><fnm>N</fnm></au><etal/></aug><source>PLoS Biol</source><pubdate>2007</pubdate><volume>5</volume><fpage>e174</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1371/journal.pbio.0050174</pubid><pubid idtype="pmcid">1892575</pubid><pubid idtype="pmpid" link="fulltext">17579518</pubid></pubidlist></xrefbib></bibl><bibl id="B33"><title><p>Does urea promote the bisulfite-mediated deamination of cytosine in DNA? Investigation aiming at speeding-up the procedure for DNA methylation analysis</p></title><aug><au><snm>Hayatsu</snm><fnm>H</fnm></au><au><snm>Tsuji</snm><fnm>K</fnm></au><au><snm>Negishi</snm><fnm>K</fnm></au></aug><source>Nucleic Acids Symp Ser</source><pubdate>2006</pubdate><volume>50</volume><fpage>69</fpage><lpage>70</lpage><xrefbib><pubid idtype="doi">10.1093/nass/nrl034</pubid></xrefbib></bibl><bibl id="B34"><title><p>SOAP2: an improved ultrafast tool for short read alignment</p></title><aug><au><snm>Li</snm><fnm>R</fnm></au><au><snm>Yu</snm><fnm>C</fnm></au><au><snm>Li</snm><fnm>Y</fnm></au><au><snm>Lam</snm><fnm>T-W</fnm></au><au><snm>Yiu</snm><fnm>S-M</fnm></au><au><snm>Kristiansen</snm><fnm>K</fnm></au><au><snm>Wang</snm><fnm>J</fnm></au></aug><source>Bioinformatics</source><pubdate>2009</pubdate><volume>25</volume><fpage>1966</fpage><lpage>1967</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/btp336</pubid><pubid idtype="pmpid" link="fulltext">19497933</pubid></pubidlist></xrefbib></bibl><bibl id="B35"><title><p>The DNA methylome of human peripheral blood mononuclear cells</p></title><aug><au><snm>Li</snm><fnm>Y</fnm></au><au><snm>Zhu</snm><fnm>J</fnm></au><au><snm>Tian</snm><fnm>G</fnm></au><au><snm>Li</snm><fnm>N</fnm></au><au><snm>Li</snm><fnm>Q</fnm></au><au><snm>Ye</snm><fnm>M</fnm></au><au><snm>Zheng</snm><fnm>H</fnm></au><au><snm>Yu</snm><fnm>J</fnm></au><au><snm>Wu</snm><fnm>H</fnm></au><au><snm>Sun</snm><fnm>J</fnm></au></aug><source>PLoS Biology</source><pubdate>2010</pubdate><volume>8</volume><issue>11</issue><fpage>e1000533</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1371/journal.pbio.1000533</pubid><pubid idtype="pmcid">2976721</pubid><pubid idtype="pmpid" link="fulltext">21085693</pubid></pubidlist></xrefbib></bibl><bibl id="B36"><title><p>Bismark: a flexible aligner and methylation caller for Bisulfite-Seq applications</p></title><aug><au><snm>Krueger</snm><fnm>F</fnm></au><au><snm>Andrews</snm><fnm>SR</fnm></au></aug><source>Bioinformatics</source><pubdate>2011</pubdate><volume>27</volume><fpage>1571</fpage><lpage>1572</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/btr167</pubid><pubid idtype="pmcid">3102221</pubid><pubid idtype="pmpid" link="fulltext">21493656</pubid></pubidlist></xrefbib></bibl><bibl id="B37"><title><p>BS Seeker: precise mapping for bisulfite sequencing</p></title><aug><au><snm>Chen</snm><fnm>PY</fnm></au><au><snm>Cokus</snm><fnm>S</fnm></au><au><snm>Pellegrini</snm><fnm>M</fnm></au></aug><source>BMC Bioinformatics</source><pubdate>2010</pubdate><volume>11</volume><fpage>203</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1186/1471-2105-11-203</pubid><pubid idtype="pmcid">2871274</pubid><pubid idtype="pmpid" link="fulltext">20416082</pubid></pubidlist></xrefbib></bibl><bibl id="B38"><title><p>The sequence alignment/map format and SAMtools</p></title><aug><au><snm>Li</snm><fnm>H</fnm></au><au><snm>Handsaker</snm><fnm>B</fnm></au><au><snm>Wysoker</snm><fnm>A</fnm></au><au><snm>Fennell</snm><fnm>T</fnm></au><au><snm>Ruan</snm><fnm>J</fnm></au><au><snm>Homer</snm><fnm>N</fnm></au><au><snm>Marth</snm><fnm>G</fnm></au><au><snm>Abecasis</snm><fnm>G</fnm></au><au><snm>Durbin</snm><fnm>R</fnm></au></aug><source>Bioinformatics</source><pubdate>2009</pubdate><volume>25</volume><fpage>2078</fpage><lpage>2079</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/btp352</pubid><pubid idtype="pmcid">2723002</pubid><pubid idtype="pmpid" link="fulltext">19505943</pubid></pubidlist></xrefbib></bibl><bibl id="B39"><title><p>SOAP: short oligonucleotide alignment program</p></title><aug><au><snm>Li</snm><fnm>R</fnm></au><au><snm>Li</snm><fnm>Y</fnm></au><au><snm>Kristiansen</snm><fnm>K</fnm></au><au><snm>Wang</snm><fnm>J</fnm></au></aug><source>Bioinformatics</source><pubdate>2008</pubdate><volume>24</volume><fpage>713</fpage><lpage>714</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/btn025</pubid><pubid idtype="pmpid" link="fulltext">18227114</pubid></pubidlist></xrefbib></bibl><bibl id="B40"><title><p>TopHat: discovering splice junctions with RNA-Seq</p></title><aug><au><snm>Trapnell</snm><fnm>C</fnm></au><au><snm>Pachter</snm><fnm>L</fnm></au><au><snm>Salzberg</snm><fnm>SL</fnm></au></aug><source>Bioinformatics</source><pubdate>2009</pubdate><volume>25</volume><fpage>1105</fpage><lpage>1111</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/btp120</pubid><pubid idtype="pmcid">2672628</pubid><pubid idtype="pmpid" link="fulltext">19289445</pubid></pubidlist></xrefbib></bibl><bibl id="B41"><title><p>The neighbor-joining method: a new method for reconstructing phylogenetic trees</p></title><aug><au><snm>Saitou</snm><fnm>N</fnm></au><au><snm>Nei</snm><fnm>M</fnm></au></aug><source>Mol Biol Evol</source><pubdate>1987</pubdate><volume>4</volume><fpage>406</fpage><xrefbib><pubid idtype="pmpid" link="fulltext">3447015</pubid></xrefbib></bibl><bibl id="B42"><title><p>MEGA4: molecular evolutionary genetics analysis (MEGA) software version 4.0</p></title><aug><au><snm>Tamura</snm><fnm>K</fnm></au><au><snm>Dudley</snm><fnm>J</fnm></au><au><snm>Nei</snm><fnm>M</fnm></au><au><snm>Kumar</snm><fnm>S</fnm></au></aug><source>Molecular biology and evolution</source><pubdate>2007</pubdate><volume>24</volume><fpage>1596</fpage><lpage>1599</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/molbev/msm092</pubid><pubid idtype="pmpid" link="fulltext">17488738</pubid></pubidlist></xrefbib></bibl></refgrp>
   </bm>
</art>