<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>1741-7007-5-28</ui>
   <ji>1741-7007</ji>
   <fm>
      <dochead>Research article</dochead>
      <bibl>
         <title>
            <p>A 100%-complete sequence reveals unusually simple genomic features in the hot-spring red alga <it>Cyanidioschyzon merolae</it></p>
         </title>
         <aug>
            <au id="A1" ca="yes">
               <snm>Nozaki</snm>
               <fnm>Hisayoshi</fnm>
               <insr iid="I1"/>
               <email>nozaki@biol.s.u-tokyo.ac.jp</email>
            </au>
            <au id="A2">
               <snm>Takano</snm>
               <fnm>Hiroyoshi</fnm>
               <insr iid="I2"/>
               <email>takano@kumamoto-u.ac.jp</email>
            </au>
            <au id="A3">
               <snm>Misumi</snm>
               <fnm>Osami</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>misumi@tvr.rikkyo.ne.jp</email>
            </au>
            <au id="A4">
               <snm>Terasawa</snm>
               <fnm>Kimihiro</fnm>
               <insr iid="I5"/>
               <insr iid="I6"/>
               <email>kimitera@bio.c.u-tokyo.ac.jp</email>
            </au>
            <au id="A5">
               <snm>Matsuzaki</snm>
               <fnm>Motomichi</fnm>
               <insr iid="I1"/>
               <email>mzaki@biol.s.u-tokyo.ac.jp</email>
            </au>
            <au id="A6">
               <snm>Maruyama</snm>
               <fnm>Shinichiro</fnm>
               <insr iid="I1"/>
               <insr iid="I6"/>
               <email>maruyama@biol.s.u-tokyo.ac.jp</email>
            </au>
            <au id="A7">
               <snm>Nishida</snm>
               <fnm>Keiji</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>keiji@platz.jp</email>
            </au>
            <au id="A8">
               <snm>Yagisawa</snm>
               <fnm>Fumi</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>z20022379@rikkyo.ne.jp</email>
            </au>
            <au id="A9">
               <snm>Yoshida</snm>
               <fnm>Yamato</fnm>
               <insr iid="I7"/>
               <insr iid="I4"/>
               <email>67524@ib.k.u-tokyo.ac.jp</email>
            </au>
            <au id="A10">
               <snm>Fujiwara</snm>
               <fnm>Takayuki</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>05ld010s@stu.rikkyo.ne.jp</email>
            </au>
            <au id="A11">
               <snm>Takio</snm>
               <fnm>Susumu</fnm>
               <insr iid="I8"/>
               <email>stakio@gpo.kumamoto-u.ac.jp</email>
            </au>
            <au id="A12">
               <snm>Tamura</snm>
               <fnm>Katsunori</fnm>
               <insr iid="I6"/>
               <email>ktamura@iam.u-tokyo.ac.jp</email>
            </au>
            <au id="A13">
               <snm>Chung</snm>
               <mnm>Jin</mnm>
               <fnm>Sung</fnm>
               <insr iid="I2"/>
               <insr iid="I10"/>
               <email>sjchung@kaeri.re.kr</email>
            </au>
            <au id="A14">
               <snm>Nakamura</snm>
               <fnm>Soichi</fnm>
               <insr iid="I9"/>
               <email>nsoichi@sci.u-ryukyu.ac.jp</email>
            </au>
            <au id="A15">
               <snm>Kuroiwa</snm>
               <fnm>Haruko</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>haruko-k@tvr.rikkyo.ne.jp</email>
            </au>
            <au id="A16">
               <snm>Tanaka</snm>
               <fnm>Kan</fnm>
               <insr iid="I6"/>
               <email>kntanaka@iam.u-tokyo.ac.jp</email>
            </au>
            <au id="A17">
               <snm>Sato</snm>
               <fnm>Naoki</fnm>
               <insr iid="I5"/>
               <email>naokisat@bio.c.u-tokyo.ac.jp</email>
            </au>
            <au id="A18">
               <snm>Kuroiwa</snm>
               <fnm>Tsuneyoshi</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>tsune@rikkyo.ne.jp</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Department of Biological Sciences, Graduate School of Science, the University of Tokyo, Tokyo, Japan</p>
            </ins>
            <ins id="I2">
               <p>Graduate School of Science and Technology, Kumamoto University, Japan</p>
            </ins>
            <ins id="I3">
               <p>Department of Life Science, College of Science, Rikkyo (St. Paul's) University, Tokyo, Japan</p>
            </ins>
            <ins id="I4">
               <p>Research Information Center for Extremophile, Rikkyo (St. Paul's) University, Tokyo, Japan</p>
            </ins>
            <ins id="I5">
               <p>Department of Life Sciences, Graduate School of Arts and Sciences, the University of Tokyo, Tokyo, Japan</p>
            </ins>
            <ins id="I6">
               <p>Institute of Molecular and Cellular Biosciences, the University of Tokyo, Tokyo, Japan</p>
            </ins>
            <ins id="I7">
               <p>Department of Integrated Biosciences, Graduate School of Frontier Sciences, the University of Tokyo, Chiba, Japan</p>
            </ins>
            <ins id="I8">
               <p>Center for Marine Environment Studies, Kumamoto University, Kumamoto, Japan</p>
            </ins>
            <ins id="I9">
               <p>Laboratory of Cell and Functional Biology, Faculty of Science, University of the Ryukyus, Okinawa, Japan</p>
            </ins>
            <ins id="I10">
               <p>Radiation Research Center for Bio-Technology, Advanced Radiation Technology Institute, Korea Atomic Energy Research Institute, Jeollabuk-do, Korea</p>
            </ins>
         </insg>
         <source>BMC Biology</source>
         <issn>1741-7007</issn>
         <pubdate>2007</pubdate>
         <volume>5</volume>
         <issue>1</issue>
         <fpage>28</fpage>
         <url>http://www.biomedcentral.com/1741-7007/5/28</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">17623057</pubid>
               <pubid idtype="doi">10.1186/1741-7007-5-28</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>31</day>
               <month>1</month>
               <year>2007</year>
            </date>
         </rec>
         <acc>
            <date>
               <day>10</day>
               <month>7</month>
               <year>2007</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>10</day>
               <month>7</month>
               <year>2007</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2007</year>
         <collab>Nozaki et al; licensee BioMed Central Ltd.</collab>
         <note>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>All previously reported eukaryotic nuclear genome sequences have been incomplete, especially in highly repeated units and chromosomal ends. Because repetitive DNA is important for many aspects of biology, complete chromosomal structures are fundamental for understanding eukaryotic cells. Our earlier, nearly complete genome sequence of the hot-spring red alga <it>Cyanidioschyzon merolae </it>revealed several unique features, including just three ribosomal DNA copies, very few introns, and a small total number of genes. However, because the exact structures of certain functionally important repeated elements remained ambiguous, that sequence was not complete. Obviously, those ambiguities needed to be resolved before the unique features of the <it>C. merolae </it>genome could be summarized, and the ambiguities could only be resolved by completing the sequence. Therefore, we aimed to complete all previous gaps and sequence all remaining chromosomal ends, and now report the first nuclear-genome sequence for any eukaryote that is 100% complete.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>Our present complete sequence consists of 16546747 nucleotides covering 100% of the 20 linear chromosomes from telomere to telomere, representing the simple and unique chromosomal structures of the eukaryotic cell. We have unambiguously established that the <it>C. merolae </it>genome contains the smallest known histone-gene cluster, a unique telomeric repeat for all chromosomal ends, and an extremely low number of transposons.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>By virtue of these attributes and others that we had discovered previously, <it>C. merolae </it>appears to have the simplest nuclear genome of the non-symbiotic eukaryotes. These unusually simple genomic features in the 100% complete genome sequence of <it>C. merolae </it>are extremely useful for further studies of eukaryotic cells.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>The biological sciences have been embracing a new paradigm as a result of accruing genome information <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr><abbr bid="B6">6</abbr><abbr bid="B7">7</abbr><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr><abbr bid="B13">13</abbr></abbrgrp>. However, all previously reported eukaryotic nuclear genome sequences have been incomplete, especially in highly repeated units and chromosomal ends. Because repetitive DNA is essential to genome function <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>, and may contribute to the diversity of isoforms <abbrgrp><abbr bid="B15">15</abbr></abbrgrp> and the evolution of life <abbrgrp><abbr bid="B16">16</abbr></abbrgrp>, complete chromosomal structures are fundamental for understanding eukaryotic cells.</p>
         <p>Our recently published nuclear-genome sequence of the ultra-small, hot-spring red alga, <it>Cyanidioschyzon merolae </it>10D, revealed some unique features, such as very few introns, only three copies of ribosomal (r)DNA, and a small total number of genes <abbrgrp><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr></abbrgrp>. However, because uncertainties remained regarding the features of certain important repeated elements, such as histone-gene clusters and telomeres <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>, this sequence, like all previous eukaryotic nuclear-genome sequences, was incomplete. Given the functional significance of such elements <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>, it was obviously desirable to complete the sequence and resolve all ambiguities before attempting to summarize all of the unique features of the <it>C. merolae </it>genome. Therefore, we aimed to complete all previous gaps and sequenced all the remaining chromosomal ends, to construct the first nuclear genome sequence that is 100% complete. The results demonstrated that <it>C. merolae </it>possesses the simplest nuclear genome known among non-symbiotic eukaryotes.</p>
      </sec>
      <sec>
         <st>
            <p>Results and Discussion</p>
         </st>
         <sec>
            <st>
               <p>A 100%-complete genome sequence</p>
            </st>
            <p>Completing the nuclear genome sequence, from telomere to telomere, without gaps or ambiguities, required two distinct subprojects: (i) filling in all 46 previously existing gaps between contigs, and (ii) sequencing the 34 (of 40) chromosome ends that had not been sequenced previously by the shotgun method <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>. Using PCR with sequence-specific primers to amplify portions of the <it>C. merolae </it>bacterial artificial chromosomes (BACs) that contained gap regions of interest, and then sequencing the resulting subclones, we have reduced the number of gaps between contigs from 46 to zero (Figure <figr fid="F1">1</figr>). A variety of methods (Additional files <supplr sid="S1">1</supplr>, <supplr sid="S2">2</supplr>) were then used to sequence all of the chromosomal ends that had not been sequenced previously (Figure <figr fid="F1">1</figr>). The global size of the 46 gaps that we have sequenced in this study is 46 469 base pairs. These sequences are G+C-rich (61%) compared with that of the whole nuclear genome (55%), and six of the 46 have extremely high G+C contents (70&#8211;76%). Furthermore, sequences corresponding to 13 previous gaps have extremely high nucleotide identity (99.4&#8211;100%) to other genomic regions. It turns out that the nuclear genomic sequence previously reported <abbrgrp><abbr bid="B9">9</abbr></abbrgrp> contains misassembled and/or incorrect sequences of >20 kbp in total. The resulting complete genome sequence contains 16546747 base pairs and covers 100% of the chromosomal genome, from telomere to telomere. The numbers of base pairs in each of the 20 nuclear chromosomes are given in Table <tblr tid="T1">1</tblr>. These 20 linear nuclear chromosomes plus the two circular organellar DNA molecules <abbrgrp><abbr bid="B17">17</abbr><abbr bid="B18">18</abbr></abbrgrp> comprise the entire genome of the organism, and contain 16728945 base pairs (Table <tblr tid="T1">1</tblr>).</p>
            <suppl id="S1">
               <title>
                  <p>Additional file 1</p>
               </title>
               <text>
                  <p><b>Supplementary methods</b>: Cloning and sequencing of terminal regions of all chromosomes, and complete determination of the histone cluster area in <it>C. merolae</it>.</p>
               </text>
               <file name="1741-7007-5-28-S1.doc">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <suppl id="S2">
               <title>
                  <p>Additional file 2</p>
               </title>
               <text>
                  <p><b>Table 2</b>. Primers used for determination of terminal sequences of <it>C. merolae </it>chromosomes.</p>
               </text>
               <file name="1741-7007-5-28-S2.doc">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Bird's-eye view of the 100% complete structures of 20 <it>C. merolae </it>chromosomes</p>
               </caption>
               <text>
                  <p><b>Bird's-eye view of the 100% complete structures of 20 <it>C. merolae </it>chromosomes</b>. This shows regions that were filled in the present study ('Gap' and 'Chromosomal end'), telomere repeats, the histone cluster area, localization of transposable elements ('Class I' and 'Class II') and putative centromeric regions [9].</p>
               </text>
               <graphic file="1741-7007-5-28-1"/>
            </fig>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Key features of the 22 chromosomes constituting the three genomes of the hot-spring red alga <it>Cyanidioschyzon merolae </it>10D</p>
               </caption>
               <tblbdy cols="4">
                  <r>
                     <c ca="left">
                        <p>Genome/Chromosome</p>
                     </c>
                     <c ca="left">
                        <p>No. of nucleotides(bp)</p>
                     </c>
                     <c ca="left">
                        <p>Shape of chromosome</p>
                     </c>
                     <c ca="left">
                        <p>No. of protein-coding genes</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Nucleus*</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>1</p>
                     </c>
                     <c ca="left">
                        <p>422 616</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>102</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>2</p>
                     </c>
                     <c ca="left">
                        <p>457 013</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>125</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>3</p>
                     </c>
                     <c ca="left">
                        <p>481 791</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>144</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>4</p>
                     </c>
                     <c ca="left">
                        <p>513 455</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>140</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>5</p>
                     </c>
                     <c ca="left">
                        <p>528 682</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>161</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>6</p>
                     </c>
                     <c ca="left">
                        <p>536 163</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>131</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>7</p>
                     </c>
                     <c ca="left">
                        <p>584 452</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>173</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>8</p>
                     </c>
                     <c ca="left">
                        <p>739 753</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>213</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>9</p>
                     </c>
                     <c ca="left">
                        <p>810 151</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>231</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>10</p>
                     </c>
                     <c ca="left">
                        <p>839 707</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>247</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>11</p>
                     </c>
                     <c ca="left">
                        <p>852 849</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>236</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>12</p>
                     </c>
                     <c ca="left">
                        <p>859 119</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>258</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>13</p>
                     </c>
                     <c ca="left">
                        <p>866 983</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>249</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>14</p>
                     </c>
                     <c ca="left">
                        <p>852 727</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>256</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>15</p>
                     </c>
                     <c ca="left">
                        <p>902 900</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>265</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>16</p>
                     </c>
                     <c ca="left">
                        <p>908 485</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>261</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>17</p>
                     </c>
                     <c ca="left">
                        <p>1 232 258</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>355</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>18</p>
                     </c>
                     <c ca="left">
                        <p>1 253 087</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>360</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>19</p>
                     </c>
                     <c ca="left">
                        <p>1 282 939</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>384</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>20</p>
                     </c>
                     <c ca="left">
                        <p>1 621 617</p>
                     </c>
                     <c ca="left">
                        <p>Linear</p>
                     </c>
                     <c ca="left">
                        <p>484</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Total</p>
                     </c>
                     <c ca="left">
                        <p>16 546 747</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>4 775</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Unassigned</p>
                     </c>
                     <c ca="left">
                        <p>0</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Plastid [17]</p>
                     </c>
                     <c ca="left">
                        <p>149 987</p>
                     </c>
                     <c ca="left">
                        <p>Circular</p>
                     </c>
                     <c ca="left">
                        <p>208</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Mitochondrion [16]</p>
                     </c>
                     <c ca="left">
                        <p>32 211</p>
                     </c>
                     <c ca="left">
                        <p>Circular</p>
                     </c>
                     <c ca="left">
                        <p>34</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total of 3 genomes</p>
                     </c>
                     <c ca="left">
                        <p>16 728 945</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>5 017</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>*Based on the present 100% nuclear genome sequence.</p>
               </tblfn>
            </tbl>
         </sec>
         <sec>
            <st>
               <p>Histone-gene cluster</p>
            </st>
            <p>The total number of histone genes varies greatly by species. Animal genomes typically have several hundred to several thousand histone genes organized as a set of tandemly repeating quintets of the five major histone gene types <abbrgrp><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr></abbrgrp>. In contrast, histone genes are located on more than one chromosome in some organisms, such as the ultra-small green alga <it>Ostreococcus </it><abbrgrp><abbr bid="B12">12</abbr></abbrgrp> and the flowering plant <it>Arabidopsis </it><abbrgrp><abbr bid="B4">4</abbr></abbrgrp>. In our previous study, the complete organization of the histone cluster area in the <it>C. merolae </it>genome was left unresolved, because of several gaps within this region of sequence <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>. However, our present complete sequence establishes that all <it>C. merolae </it>histone genes are localized on chromosome 14 and form a small cluster (around 48 kbp long) that includes two copies of the three core histone genes (<it>H2A</it>, <it>H2B </it>and <it>H4</it>), three copies of the <it>H3 </it>gene, and a single copy of the linker-histone <it>H1 </it>gene (Figure <figr fid="F2">2</figr>). In <it>Saccharomyces cerevisiae </it><abbrgrp><abbr bid="B2">2</abbr></abbrgrp>, <it>Schizosaccharomyces pombe </it><abbrgrp><abbr bid="B6">6</abbr></abbrgrp>, <it>Dictyostelium discoideum </it><abbrgrp><abbr bid="B11">11</abbr></abbrgrp>, <it>Encephalitozoon cuniculi </it><abbrgrp><abbr bid="B5">5</abbr></abbrgrp> and <it>Ostreococcus tauri </it><abbrgrp><abbr bid="B12">12</abbr></abbrgrp> the histone genes also exhibit small copy numbers (up to three), as in <it>C. merolae</it>, but they are dispersed across more than two chromosomes. Thus, the <it>C. merolae </it>histone genes are present in the most compact cluster yet described.</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Strategy for finishing the analysis of the <it>C. merolae </it>histone gene cluster on chromosome 14, and a map of histone genes resolved within the cluster</p>
               </caption>
               <text>
                  <p><b>Strategy for finishing the analysis of the <it>C. merolae </it>histone gene cluster on chromosome 14, and a map of histone genes resolved within the cluster</b>. The black and the white squares in genes represent CDS and 5'-/3'-untranslated regions, respectively. H4-a, histone H4-a; H2B-a, histone H2B-a; ADF, actin-depolymerizing factor; S/TPK, RIO-like serine/threonine protein kinase; 40S-S13, 40S ribosomal protein S13; H3-b, histone H3-b; PTR, possible transcribed region; H2A-b, histone H2A-b; H3-c, histone H3-c; TIM50, mitochondrial preseqence translocase subunit Tim50; BAT, brabched-chain-amino-acid transaminase, mitochondrial precursor; H1, histone H1; ASM, similar to N6-adenine-specific methylase; Hyp, hypothetical transcript; TPR, hypothetical protein, conserved (containing tetratricopeptide repeats); CAB-CP24, similar to chlorophyll a/b-binding protein, CP24; H2B-b, histone H2B-b; Hyp, hypothetical protein; H4-b, histone H4-b.</p>
               </text>
               <graphic file="1741-7007-5-28-2"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Telomeres and subtelomeric regions</p>
            </st>
            <p>Whole-genome shotgun sequencing suggested that the repeat unit in <it>C. merolae </it>telomeres is AATGGGGGG <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>, but in that study only six of the 40 chromosome ends were examined <abbrgrp><abbr bid="B9">9</abbr></abbrgrp> (Figure <figr fid="F1">1</figr>). Here the sequencing of all remaining termini confirmed that AATGGGGGG is the telomere repeat sequence in all <it>C. merolae </it>chromosomal ends. In most plants, the telomeres are composed of many copies of the sequence TTTAGGG <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>, and the <it>C. merolae </it>telomere sequence, AATGGGGGG, has never yet been found elsewhere.</p>
            <p>Telomere length varies among plants from approximately 0.5 kbp in the green alga <it>Chlorella vulgaris </it>to 150 kbp in tobacco <abbrgrp><abbr bid="B22">22</abbr><abbr bid="B23">23</abbr></abbrgrp>. Telomere restriction fragment analyses using the (CCCCCCATT)3 probe revealed AATGGGGGG repeats varying from 400 to 700 bp in the total chromosomal ends in the <it>C. merolae </it>genome (data not shown). Our Southern blot analysis using a specific genomic probe suggested that <it>C. merolae </it>chromosome 15 has around a 400-bp telomere repeat sequence at the left end (see Additional file <supplr sid="S3">3</supplr>). However, the longest telomeric repeats that could be sequenced in this study were 2.5 repeats (AATGGGGGGAATGGGGGGAATGGG) in the right end of chromosome 1, possibly because long stretches of AATGGGGGG repeats are difficult to clone or sequence using conventional techniques used in this and previous studies <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>.</p>
            <suppl id="S3">
               <title>
                  <p>Additional file 3</p>
               </title>
               <text>
                  <p><b>Figure 5</b>. Telomere length analyses. (<b>A</b>) Southern hybridisation using the probe specific for the left arm of chromosome 15, demonstrating that the left end of chromosome 15 was detected using genomic DNA digested with each enzyme. H, Sa and Sp indicate genomic DNA digested with <it>Hin</it>dIII, <it>Sal</it>I and <it>Sph</it>I, respectively. (<b>B</b>) Comparison of the detected signal size with the fragment size estimated from the genome sequences.</p>
               </text>
               <file name="1741-7007-5-28-S3.doc">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>The putative telomerase catalytic subunit, telomerase reverse transcriptase (TERT) is transcribed (CMD110C) in <it>C. merolae </it><abbrgrp><abbr bid="B9">9</abbr></abbrgrp>. In the <it>C. merolae </it>genome, we found two possible telomerase RNA subunit genes in chromosomes 13 and 16, based on two transcripts, CMM123T and CMP131T, which included UUCCCCCCAUU and CCAUUCCCCCCAUU sequences, respectively. The telomerase RNA template sequence (CCCCCCAUU) has been detected in only these two hypothetical non-coding RNA genes among all the predicted genes in the present 100% complete nuclear genome. These are the first convincing candidate telomerase-RNA subunit genes in plant and algal lineages.</p>
            <p>Based on the end sequencing of all 40 chromosomal termini completed here, all of the subtelomeric regions in the <it>C. merolae </it>nuclear genome have been unveiled (Figure <figr fid="F3">3</figr>). Eight types of homologous DNA elements (up to 20 kbp), with unique gene contents, were found adjacent to the telomere repeats in the 40 chromosomal ends (Figure <figr fid="F3">3</figr>). Two of the eight types exist in only two ends; element H for 3L (left end of chromosome 3) and 16R, and element L for 3R and 11R. PH elements are the most frequent and are recognized in 6L, 7R, 8L, 8R, 11L, 14R, 18R and 19R, whereas nine termini (namely, 2L, 6R, 12R, 13L, 13R, 15L, 15R, 16L and 20R) showed no homology to other terminal regions. This situation is different from that of <it>S. cerevisiae</it>, in which core X elements exist in all chromosomal ends <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>. In the ultrasmall, obligate intracellular parasite <it>E. cuniculi </it>(Microsporidia) <abbrgrp><abbr bid="B5">5</abbr></abbrgrp> and the nucleomorphs (the reduced nuclei of the eukaryotic endosymbionts) of the cryptophyte <it>Guillardia theta </it>and chlorarachniophyte <it>Bigelowiella natans </it><abbrgrp><abbr bid="B25">25</abbr><abbr bid="B26">26</abbr><abbr bid="B27">27</abbr></abbrgrp>, both of the subtelomeric regions of all chromosomes harbor rRNA genes. However, such features are not recognized in <it>Cyanidioschyzon </it>(Figures <figr fid="F1">1</figr>, <figr fid="F3">3</figr>) and the ultra-small green <it>Ostreococcus </it><abbrgrp><abbr bid="B12">12</abbr></abbrgrp>, and thus seem to represent some evolutionary convergence resulting from the intracellular parasitism or endosymbiosis in <it>E. cuniculi </it>and the nucleomorphs.</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Complete gene contents at the terminal regions of <it>C. merolae </it>chromosomes</p>
               </caption>
               <text>
                  <p><b>Complete gene contents at the terminal regions of <it>C. merolae </it>chromosomes</b>. T, P, L, H, C, F, E, A, O, D, R, I and M represent genes for the trefoil factor, NADPH:protochlorophyllide oxidoreductase, L-lactate dehydrogenase, hedgehog protein, subunit 6a of chaperonin containing TCP1, subunit ATP5 of F<sub>1</sub>F<sub>O </sub>ATP synthase, ubiquitin conjugating enzyme E2, copper-containing amine oxidase, anion transporter, dTDP-glucose 4,6-dehydratase, dTDP-4-dehydrorhamnose reductase, iron permease, and dolichyl-phosphate-mannose:protein mannosyltransferase, respectively. Detailed information is available on the <it>C. merolae </it>Genome Project website <url>http://merolae.biol.s.u-tokyo.ac.jp/</url>. Homologous DNA elements are shown as red lines with designations.</p>
               </text>
               <graphic file="1741-7007-5-28-3"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Transposable elements</p>
            </st>
            <p>The number of transposable elements in various eukaryotes differs widely <abbrgrp><abbr bid="B28">28</abbr><abbr bid="B29">29</abbr><abbr bid="B30">30</abbr></abbrgrp>, and of all the non-symbiotic and non-pathogenic eukaryotes previously studied, yeast and pufferfish have the fewest: about 3% of the genome <abbrgrp><abbr bid="B29">29</abbr><abbr bid="B30">30</abbr></abbrgrp>. However, transposons constitute only about 0.7% of the <it>C. merolae </it>genome (by assuming that the average gene size of RT- and transposase-related elements are 4 kbp and 3 kbp, respectively). The completed <it>C. merolae </it>genome sequence contains only 26 class I elements (retrotransposons) and eight class II elements (transposons) <abbrgrp><abbr bid="B31">31</abbr></abbrgrp> (Figure <figr fid="F1">1</figr>). The transcripts of three of the 26 retrotransposons contained an intact reverse transcriptase open-reading frame, and a BLASTX search suggested that all 26 of the retrotransposons were most closely related to non-long terminal repeat (non-LTR) retrotransposons. So, although LTR retrotransposons are widely distributed in plants and animals <abbrgrp><abbr bid="B31">31</abbr></abbrgrp>, we could not find any of them in the <it>C. merolae </it>genome. All eight of the transposase-related elements of <it>C. merolae </it>were most closely related (E-value = 0.071&#8211;6 &#215; 10<sup>-7</sup>) to transposase sequences of bacterial transposons. In short, <it>C. merolae </it>is one of the two non-symbiotic eukaryotes with an extremely low abundance of transposable elements (Table <tblr tid="T2">2</tblr>). In the endosymbiotic reduced eukaryotes, <it>Encephalitozoon cuniculi </it>and nucleomorphs <abbrgrp><abbr bid="B5">5</abbr><abbr bid="B25">25</abbr><abbr bid="B26">26</abbr><abbr bid="B27">27</abbr></abbrgrp>, however, transposable elements seem lacking in chromosomes.</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Comparison of the nuclear genomes of <it>Cyanidioschyzon</it>, <it>Ostreococcus </it>(an ultra-small green alga), <it>Arabidopsis </it>(a flowering plant) and <it>Ashbya </it>(a filamentous fungal pathogen).</p>
               </caption>
               <tblbdy cols="7">
                  <r>
                     <c ca="left">
                        <p>
                           <b>Organism</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>No. of protein-coding genes</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>Genes with introns (%)</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>No. of rRNA gene units</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>No. of chromosomes with histone genes</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>Transposable elements in genome (%)</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>Telomere repeat sequences</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <it>Arabidopsis</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>26207</p>
                     </c>
                     <c ca="left">
                        <p>79</p>
                     </c>
                     <c ca="left">
                        <p>~800</p>
                     </c>
                     <c ca="left">
                        <p>5&#8804;</p>
                     </c>
                     <c ca="left">
                        <p>~15</p>
                     </c>
                     <c ca="left">
                        <p>TTTAGGG</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <it>Ostreococcus</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>8166</p>
                     </c>
                     <c ca="left">
                        <p>39</p>
                     </c>
                     <c ca="left">
                        <p>4</p>
                     </c>
                     <c ca="left">
                        <p>6&#8804;</p>
                     </c>
                     <c ca="left">
                        <p>~10</p>
                     </c>
                     <c ca="left">
                        <p>TTTAGGG</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <it>Cyanidioschyzon</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>4775</p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>0.5</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>3</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>1</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>0.7</p>
                     </c>
                     <c ca="left">
                        <p>AATGGGGGG</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <it>Ashbya</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>4718</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>5</p>
                     </c>
                     <c ca="left">
                        <p>~50</p>
                     </c>
                     <c ca="left">
                        <p>4&#8804;</p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>0.1></b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>CGCTGAGAGACCCATACACCACAC</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>Bold type indicates the smallest number in non-symbiotic eukaryotes.</p>
                  <p>Two non-symbiotic eukaryotes, <it>Schizosaccharomyces pombe </it>and the filamentous fungus <it>Ashbya gossypii</it>, have nuclear protein-coding genes that are as small in number as those of <it>C. merolae</it>.</p>
                  <p>The number of protein-coding genes in the nuclear genome of <it>S. pombe </it>[6] increased to 5004 <url>http://www.sanger.ac.uk/Projects/S_pombe/genome_stats.shtml</url>.</p>
                  <p>Although <it>A. gossypii </it>was reported to contain 4718 protein-coding nuclear genes [13], the genome project of this fungus is now in progress <url>http://agd.unibas.ch/</url>; thus it possibly contains more than 4775 protein-coding genes.</p>
               </tblfn>
            </tbl>
            <p>In contrast to this, 253 copies of a novel interspersed repetitive element were found in the <it>C. merolae </it>genome. All copies have a truncated ORF that is weakly related (BLASTX E-value = 10<sup>-5</sup>-4 &#215; 10<sup>-2</sup>) to a putative protein, WSV486, that is encoded in the genome of the shrimp spot syndrome virus <abbrgrp><abbr bid="B32">32</abbr></abbrgrp>. These repetitive elements have an average size of 3.2 kbp, are distributed randomly on all chromosomes, and altogether comprise about 5% of the genome. Because these elements exhibit transcriptional activity <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>, they may contribute to genomic or cellular functions in <it>C. merolae </it>in the same manner as repetitive DNA does in other eukaryotes <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>The smallest known histone-gene cluster, a unique telomeric repeat, a very low density of transposable elements, and other previously described simple features of the <it>C. merolae </it>nuclear genome <abbrgrp><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr></abbrgrp> (Table <tblr tid="T2">2</tblr>) are very distinctive, and constitute the simplest set of genomic features found in any non-symbiotic eukaryote yet studied. Such simple features are generally considered to result from consequences of reductive evolution of an ultra-small eukaryote <abbrgrp><abbr bid="B12">12</abbr></abbrgrp>. However, none of these features is shared by the similarly ultra-small green alga, <it>Ostreococcus</it>, in which 39% of the genes contain introns, histone genes are dispersed across at least six chromosomes, and 417 transposable elements and 8166 protein-coding genes are distributed among the chromosomes <abbrgrp><abbr bid="B12">12</abbr></abbrgrp> (see Table <tblr tid="T2">2</tblr>). These may suggest differences in modes of genome reduction between ancestors of <it>Cyanidioschyzon </it>(red algae) and <it>Ostreococcus </it>(green plants). On the other hand, algae living in acidic hot springs (pH 1.5, 45&#176;C) might be candidates for retaining ancient plant attributes, because the volcano activity is thought to have been providing such an extreme environment throughout Earth's history. Very recently, Cunningham <it>et al </it><abbrgrp><abbr bid="B33">33</abbr></abbrgrp> reported that <it>C. merolae </it>contains perhaps the simplest assortment of chlorophylls and carotenoids found in any eukaryotic photosynthetic organism. In addition, the <it>C. merolae </it>plastid genome contains a large number of genes, which is thought to be a primitive feature, because reversal of plastid-gene loss is generally considered to be impossible <abbrgrp><abbr bid="B34">34</abbr><abbr bid="B35">35</abbr></abbrgrp>. Thus, our hypothesis is that some of the unusual or simple genomic characteristics of <it>C. merolae </it>may represent primitive features that have been conserved in <it>Cyanidioschyzon</it>, but have become extensively modified during the evolution of other plant lineages. Alternatively, the unique genomic features of <it>C. merolae </it>(Table <tblr tid="T2">2</tblr>) may reflect adaptation to the extreme environment. However, genome information for other hot-spring red algae is very limited. The recently released nuclear genome sequence of another hot-spring red alga <it>Galdieria </it>has not revealed the chromosomal structures of its components, such as rDNA units or histone cluster area. <abbrgrp><abbr bid="B36">36</abbr></abbrgrp>. Further information on the complete nuclear genomes of other plants, including other hot-spring red algae, red macro-algae, and other members of plant and algal lineages, will be needed to determine whether <it>C. merolae </it>actually has primitive genomic features.</p>
         <p>Three kinds of genomes are found in many eukaryotic cells: nuclear, mitochondrial, and plastid <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>. Based on the present nuclear genome data and the previously published mitochondrial and plastid genome sequences <abbrgrp><abbr bid="B18">18</abbr><abbr bid="B19">19</abbr></abbrgrp>, all major types of eukaryotic genetic information are present in <it>C. merolae</it>. In addition, as revealed by the present 100% complete genome, <it>C. merolae </it>contains unusually simple sets of genes and sequences (Table <tblr tid="T2">2</tblr>). For example, because almost all protein-coding nuclear genes of <it>C. merolae </it>lack introns (Table <tblr tid="T2">2</tblr>), the complete sequence of the genome provided here can be used directly to deduce the sequences of all of its proteins, which will make it extremely valuable for future proteomics research. Therefore, <it>C. merolae </it>represents an ideal model organism for studying the fundamental relationships among the chloroplast, mitochondrial and nuclear of genomes. The complete nuclear genome sequence reported here will greatly improve the precision of biological analyses of <it>C. merolae</it>, including studies of chromosome structure and gene structure/annotation. Furthermore, because <it>C. merolae </it>inhabits hot springs (45&#176;C) <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>, most of its proteins must be unusually heat-stable, and so its proteome may well provide important new insights into the structural basis for heat stability of proteins.</p>
      </sec>
      <sec>
         <st>
            <p>Methods</p>
         </st>
         <sec>
            <st>
               <p>Filling gaps between contigs/fragments</p>
            </st>
            <p>Previously constructed <it>C. merolae </it>BAC clones <abbrgrp><abbr bid="B9">9</abbr></abbrgrp> were used for filling in previously existing gaps between contigs. PCRs of BAC clones containing unsequenced regions were carried out using <it>Taq </it>polymerase with GC buffer (Takara LA Taq; Takara Bio Inc., Osaka, Japan) and specific primers complementary to sequences flanking the gaps. DNA walking annealing control primer technology (DNA Walking SpeedUp&#8482; Kit; Seegene, Seoul, Korea) was also used to directly amplify unknown sequences adjacent to known sequences within a contig. PCR products were sequenced by cycle sequencing (Big-Dye Terminator Cycle Sequencing Kit v 3.1; Applied Biosystems, Foster City, CA, USA), except for a single gap in chromosome 10, which was filled by a sequencing reaction performed using <it>in vitro </it>transcription (CUGA Sequencing Kit; Nippon Genetech Co., Ltd., Tokyo, Japan).</p>
         </sec>
         <sec>
            <st>
               <p>Sequencing of each chromosomal end</p>
            </st>
            <p>PolyC-tailing and the anchor primer method, the inverse PCR method and the asymmetric PCR method were used for sequencing the ends of chromosomes. For details, see Additional files <supplr sid="S1">1</supplr> and <supplr sid="S2">2</supplr>.</p>
         </sec>
         <sec>
            <st>
               <p>Assembling sequence data and gene annotation</p>
            </st>
            <p>Assembling of sequence data and two strategies for gene prediction have been described previously <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Complete determination of the histone cluster area</p>
            </st>
            <p>To determine the complete sequences of the histone cluster area in the <it>C. merolae </it>genome, we carried out <it>Not</it>I and <it>Apa</it>I subcloning of the BAC clone GESZ2-b20, which included possible histone clusters in chromosome 14 <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>. Restriction-enzyme analysis, Southern blot analysis with histone-related probes and end sequencing of the subclones revealed relative positions of the subclones on chromosome 14 (Figure <figr fid="F2">2</figr>). Six gaps between contigs/fragments in the histone cluster area <abbrgrp><abbr bid="B9">9</abbr></abbrgrp> were filled using primer walking of the subclones. For details, see Additional files <supplr sid="S1">1</supplr> and <supplr sid="S4">4</supplr>.</p>
            <suppl id="S4">
               <title>
                  <p>Additional file 4</p>
               </title>
               <text>
                  <p><b>Table 3</b>. Primers used for completing the <it>C. merolae </it>histone cluster area.</p>
               </text>
               <file name="1741-7007-5-28-S4.doc">
                  <p>Click here for file</p>
               </file>
            </suppl>
         </sec>
         <sec>
            <st>
               <p>Accession numbers</p>
            </st>
            <p>The 100% chromosome sequences are accessible under the DDBJ with accession numbers <ext-link ext-link-type="ddbj" ext-link-id="AP006483">AP006483</ext-link>&#8211;<ext-link ext-link-type="ddbj" ext-link-id="AP006502">AP006502</ext-link> (chromosome 1&#8211;20). Sequences and annotation are available at <url>http://merolae.biol.s.u-tokyo.ac.jp/</url>.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>HN, OM, KN, FY, YY, TF, SN, HK and TK performed filling contig gaps. HT, SM, KatT, SJC and KanT determined the chromosomal ends. KiT and NS completed the histone cluster area. MM and OM assembled the sequence data. ST analysed the transposable elements. All authors discussed the results and commented on the manuscript.</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>We thank Professor D. L. Kirk (Washington University) for critically reading the manuscript. This work was supported by Grant-in-Aid for Creative Scientific Research (No. 16GS0304 to KanT, NS and HN) and Grant-in-Aid for Scientific Research (No. 17370087 to HN), from the Ministry of Education, Culture, Sports, Science and Technology of Japan; and by grants from Frontier Project "Adaptation and Evolution of Extremophile" (to TK) from the Ministry of Education, Culture, Sports, Science and Technology of Japan, and from the Program for the Promotion of Basic Research Activities for Innovative Biosciences (PROBRAIN to TK).</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Life with 6000 genes</p>
            </title>
            <aug>
               <au>
                  <snm>Goffeau</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Barrell</snm>
                  <fnm>BG</fnm>
               </au>
               <au>
                  <snm>Bussey</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Davis</snm>
                  <fnm>RW</fnm>
               </au>
               <au>
                  <snm>Dujon</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Feldmann</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Galibert</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Hoheisel</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Jacq</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Johnston</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Louis</snm>
                  <fnm>EJ</fnm>
               </au>
               <au>
                  <snm>Mewes</snm>
                  <fnm>HW</fnm>
               </au>
               <au>
                  <snm>Murakami</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Philippsen</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Tettelin</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Oliver</snm>
                  <fnm>SG</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>1996</pubdate>
            <volume>274</volume>
            <fpage>563</fpage>
            <lpage>567</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1126/science.274.5287.546</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p><it>Saccharomyces </it>Genome Database (SGD) provides tools to identify and analyze sequences from <it>Saccharomyces cerevisiae </it>and related sequences from other organisms</p>
            </title>
            <aug>
               <au>
                  <snm>Christie</snm>
                  <fnm>KR</fnm>
               </au>
               <au>
                  <snm>Weng</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Balakrishnan</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Costanzo</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Dolinski</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Dwight</snm>
                  <fnm>SS</fnm>
               </au>
               <au>
                  <snm>Engel</snm>
                  <fnm>SR</fnm>
               </au>
               <au>
                  <snm>Feierbach</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Fisk</snm>
                  <fnm>DG</fnm>
               </au>
               <au>
                  <snm>Hirschman</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Hong</snm>
                  <fnm>EL</fnm>
               </au>
               <au>
                  <snm>Issel-Tarver</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Nash</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Sethuraman</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Starr</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Theesfeld</snm>
                  <fnm>CL</fnm>
               </au>
               <au>
                  <snm>Andrada</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Binkley</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Dong</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Lane</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Schroeder</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Botstein</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Cherry</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>Nucl Acids Res</source>
            <pubdate>2004</pubdate>
            <volume>32</volume>
            <fpage>D311</fpage>
            <lpage>D314</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">308767</pubid>
                  <pubid idtype="pmpid" link="fulltext">14681421</pubid>
                  <pubid idtype="doi">10.1093/nar/gkh033</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Genome sequence of the nematode <it>C. elegans</it>: a platform for investigating biology</p>
            </title>
            <aug>
               <au>
                  <cnm><it>C. elegans </it>Sequencing Consortium</cnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>1998</pubdate>
            <volume>282</volume>
            <fpage>1012</fpage>
            <lpage>1018</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1126/science.282.5396.2012</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <title>
               <p>Analysis of the genome sequence of the flowering plant <it>Arabidopsis thaliana</it></p>
            </title>
            <aug>
               <au>
                  <cnm><it>Arabidopsis </it>Genome Initiative</cnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2000</pubdate>
            <volume>408</volume>
            <fpage>796</fpage>
            <lpage>815</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/35048692</pubid>
                  <pubid idtype="pmpid" link="fulltext">11130711</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Genome sequence and gene compaction of the eukaryote parasite <it>Encephalitozoon cuniculi</it></p>
            </title>
            <aug>
               <au>
                  <snm>Katinka</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Duprat</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Cornillot</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Metenier</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Thomarat</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Prensier</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Barbe</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Peyretaillade</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Brottier</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Wincker</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Delbac</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>El Alaoui</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Peyret</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Saurin</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Gouy</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Weissenbach</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Vivares</snm>
                  <fnm>CP</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2001</pubdate>
            <volume>414</volume>
            <issue>6862</issue>
            <fpage>450</fpage>
            <lpage>453</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/35106579</pubid>
                  <pubid idtype="pmpid" link="fulltext">11719806</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B6">
            <title>
               <p>The genome sequence of <it>Schizosaccharomyces pombe</it></p>
            </title>
            <aug>
               <au>
                  <snm>Wood</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Gwilliam</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Rajandream</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Lyne</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Lyne</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Stewart</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Sgouros</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Peat</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Hayles</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Baker</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Basham</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Bowman</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Brooks</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Brown</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Brown</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Chillingworth</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Churcher</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Collins</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Connor</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Cronin</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Davis</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Feltwell</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Fraser</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Gentles</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Goble</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Hamlin</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Harris</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Hidalgo</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Hodgson</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Holroyd</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Hornsby</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Howarth</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Huckle</snm>
                  <fnm>EJ</fnm>
               </au>
               <au>
                  <snm>Hunt</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Jagels</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>James</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Leather</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>McDonald</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>McLean</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Mooney</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Moule</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Mungall</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Murphy</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Niblett</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Odell</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Oliver</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>O'Neil</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Pearson</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Quail</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Rabbinowitsch</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Rutherford</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Rutter</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Saunders</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Seeger</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Sharp</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Skelton</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Simmonds</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Squares</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Squares</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Stevens</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Taylor</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Taylor</snm>
                  <fnm>RG</fnm>
               </au>
               <au>
                  <snm>Tivey</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Walsh</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Warren</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Whitehead</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Woodward</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Volckaert</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Aert</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Robben</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Grymonprez</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Weltjens</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Vanstreels</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Rieger</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Schafer</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Muller-Auer</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Gabel</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Fuchs</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Dusterhoft</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Fritzc</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Holzer</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Moestl</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Hilbert</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Borzym</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Langer</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Beck</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Lehrach</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Reinhardt</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Pohl</snm>
                  <fnm>TM</fnm>
               </au>
               <au>
                  <snm>Eger</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Zimmermann</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Wedler</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Wambutt</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Purnelle</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Goffeau</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Cadieu</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Dreano</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Gloux</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Lelaure</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Mottier</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Galibert</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Aves</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Xiang</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Hunt</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Moore</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Hurst</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Lucas</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Rochet</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Gaillardin</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Tallada</snm>
                  <fnm>VA</fnm>
               </au>
               <au>
                  <snm>Garzon</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Thode</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Daga</snm>
                  <fnm>RR</fnm>
               </au>
               <au>
                  <snm>Cruzado</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Jimenez</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Sanchez</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>del Rey</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Benito</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Dominguez</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Revuelta</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>Moreno</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Armstrong</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Forsburg</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Cerutti</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Lowe</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>McCombie</snm>
                  <fnm>WR</fnm>
               </au>
               <au>
                  <snm>Paulsen</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Potashkin</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Shpakovski</snm>
                  <fnm>GV</fnm>
               </au>
               <au>
                  <snm>Ussery</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Barrell</snm>
                  <fnm>BG</fnm>
               </au>
               <au>
                  <snm>Nurse</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2002</pubdate>
            <volume>415</volume>
            <fpage>871</fpage>
            <lpage>880</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature724</pubid>
                  <pubid idtype="pmpid" link="fulltext">11859360</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>Finishing a whole-genome shotgun: release 3 of the <it>Drosophila melanogaster </it>euchromatic genome sequence</p>
            </title>
            <aug>
               <au>
                  <snm>Celniker</snm>
                  <fnm>SE</fnm>
               </au>
               <au>
                  <snm>Wheeler</snm>
                  <fnm>DA</fnm>
               </au>
               <au>
                  <snm>Kronmiller</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Carlson</snm>
                  <fnm>JW</fnm>
               </au>
               <au>
                  <snm>Halpern</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Patel</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Adams</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Champe</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Dugan</snm>
                  <fnm>SP</fnm>
               </au>
               <au>
                  <snm>Frise</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Hodgson</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>George</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Hoskins</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Laverty</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Muzny</snm>
                  <fnm>DM</fnm>
               </au>
               <au>
                  <snm>Nelson</snm>
                  <fnm>CR</fnm>
               </au>
               <au>
                  <snm>Pacleb</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Pfeiffer</snm>
                  <fnm>BD</fnm>
               </au>
               <au>
                  <snm>Richards</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Sodergren</snm>
                  <fnm>EJ</fnm>
               </au>
               <au>
                  <snm>Svirskas</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Tabor</snm>
                  <fnm>PE</fnm>
               </au>
               <au>
                  <snm>Wan</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Stapleton</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Sutton</snm>
                  <fnm>GG</fnm>
               </au>
               <au>
                  <snm>Venter</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Weinstock</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Scherer</snm>
                  <fnm>SE</fnm>
               </au>
               <au>
                  <snm>Myers</snm>
                  <fnm>EW</fnm>
               </au>
               <au>
                  <snm>Gibbs</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Rubin</snm>
                  <fnm>GM</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2002</pubdate>
            <volume>3</volume>
            <fpage>research0079.1</fpage>
            <lpage>0079.14</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1186/gb-2002-3-12-research0079</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Finishing the euchromatic sequence of the human genome</p>
            </title>
            <aug>
               <au>
                  <cnm>International Human Genome Sequencing Consortium</cnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2004</pubdate>
            <volume>431</volume>
            <fpage>931</fpage>
            <lpage>945</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature03001</pubid>
                  <pubid idtype="pmpid" link="fulltext">15496913</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>Genome sequence of the ultra-small unicellular red alga <it>Cyanidioschyzon merolae </it>10D</p>
            </title>
            <aug>
               <au>
                  <snm>Matsuzaki</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Misumi</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Shin-i</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Maruyama</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Takahara</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Miyagishima</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Mori</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Nishida</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Yagisawa</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Yoshida</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Nishimura</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Nakao</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Kobayashi</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Momoyama</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Higashiyama</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Minoda</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Sano</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Nomoto</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Oishi</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Hayashi</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Ohta</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Nishizaka</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Haga</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Miura</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Morishita</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Kabeya</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Terasawa</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Suzuki</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Ishii</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Asakawa</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Takano</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Ohta</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Kuroiwa</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Tanaka</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Shimizu</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Sugano</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Sato</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Nozaki</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Ogasawara</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Kohara</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Kuroiwa</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2004</pubdate>
            <volume>428</volume>
            <fpage>653</fpage>
            <lpage>657</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature02398</pubid>
                  <pubid idtype="pmpid" link="fulltext">15071595</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p><it>Cyanidioschyzon merolae </it>genome. A tool for facilitating comparable studies on organelle biogenesis in photosynthetic eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Misumi</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Matsuzaki</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Nozaki</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Miyagishima</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Mori</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Nishida</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Yagisawa</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Yoshida</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Kuroiwa</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Kuroiwa</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Plant Physiol</source>
            <pubdate>2005</pubdate>
            <volume>137</volume>
            <fpage>567</fpage>
            <lpage>585</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1065357</pubid>
                  <pubid idtype="pmpid" link="fulltext">15681662</pubid>
                  <pubid idtype="doi">10.1104/pp.104.053991</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>The genome of the social amoeba <it>Dictyostelium discoideum</it></p>
            </title>
            <aug>
               <au>
                  <snm>Eichinger</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Pachebat</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Glockner</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Rajandream</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Sucgang</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Berriman</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Song</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Olsen</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Szafranski</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Tunggal</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Kummerfeld</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Madera</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Konfortov</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Rivero</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Bankier</snm>
                  <fnm>AT</fnm>
               </au>
               <au>
                  <snm>Lehmann</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Hamlin</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Davies</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Gaudet</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Fey</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Pilcher</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Saunders</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Sodergren</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Davis</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Kerhornou</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Nie</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Hall</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Anjard</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Hemphill</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Bason</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Farbrother</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Desany</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Just</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Morio</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Rost</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Churcher</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Cooper</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Haydock</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>van Driessche</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Cronin</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Goodhead</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Muzny</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Mourier</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Pain</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Lu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Harper</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Lindsay</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Hauser</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>James</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Quiles</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Madan Babu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Saito</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Buchrieser</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Wardroper</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Felder</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Thangavelu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Johnson</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Knights</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Loulseged</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Mungall</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Oliver</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Price</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Quail</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Urushihara</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Hernandez</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Rabbinowitsch</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Steffen</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Sanders</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Ma</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kohara</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Sharp</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Simmonds</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Spiegler</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Tivey</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Sugano</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Walker</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Woodward</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Winckler</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Tanaka</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Shaulsky</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Schleicher</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Weinstock</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Rosenthal</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Cox</snm>
                  <fnm>EC</fnm>
               </au>
               <au>
                  <snm>Chisholm</snm>
                  <fnm>RL</fnm>
               </au>
               <au>
                  <snm>Gibbs</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Loomis</snm>
                  <fnm>WF</fnm>
               </au>
               <au>
                  <snm>Platzer</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kay</snm>
                  <fnm>RR</fnm>
               </au>
               <au>
                  <snm>Williams</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Dear</snm>
                  <fnm>PH</fnm>
               </au>
               <au>
                  <snm>Noegel</snm>
                  <fnm>AA</fnm>
               </au>
               <au>
                  <snm>Barrell</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Kuspa</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2005</pubdate>
            <volume>435</volume>
            <fpage>43</fpage>
            <lpage>57</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1352341</pubid>
                  <pubid idtype="pmpid" link="fulltext">15875012</pubid>
                  <pubid idtype="doi">10.1038/nature03481</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Genome analysis of the smallest free-living eukaryote <it>Ostreococcus tauri </it>unveils many unique features</p>
            </title>
            <aug>
               <au>
                  <snm>Derelle</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Ferraz</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Rombauts</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Rouze</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Worden</snm>
                  <fnm>AZ</fnm>
               </au>
               <au>
                  <snm>Robbens</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Partensky</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Degroeve</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Echeynie</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Cooke</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Saeys</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Wuyts</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Jabbari</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Bowler</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Panaud</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Piegu</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Ball</snm>
                  <fnm>SG</fnm>
               </au>
               <au>
                  <snm>Ral</snm>
                  <fnm>JP</fnm>
               </au>
               <au>
                  <snm>Bouget</snm>
                  <fnm>FY</fnm>
               </au>
               <au>
                  <snm>Piganeau</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>De Baets</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Picard</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Delseny</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Demaille</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Van de Peer</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Moreau</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2006</pubdate>
            <volume>103</volume>
            <fpage>11647</fpage>
            <lpage>11652</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1544224</pubid>
                  <pubid idtype="pmpid" link="fulltext">16868079</pubid>
                  <pubid idtype="doi">10.1073/pnas.0604795103</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p><it>Ashbya </it>Genome Database 3.0: a cross-species genome and transcriptome browser for yeast biologists</p>
            </title>
            <aug>
               <au>
                  <snm>Gattiker</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Rischatsch</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Demougin</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Voegeli</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Dietrich</snm>
                  <fnm>FS</fnm>
               </au>
               <au>
                  <snm>Philippsen</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Primig</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>BMC Genomics</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <fpage>9</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1779777</pubid>
                  <pubid idtype="pmpid" link="fulltext">17212814</pubid>
                  <pubid idtype="doi">10.1186/1471-2164-8-9</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Why repetitive DNA is essential to genome function</p>
            </title>
            <aug>
               <au>
                  <snm>Shapiro</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>von Sternberg</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Biol Rev</source>
            <pubdate>2005</pubdate>
            <volume>80</volume>
            <fpage>227</fpage>
            <lpage>250</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1017/S1464793104006657</pubid>
                  <pubid idtype="pmpid">15921050</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p><it>Drosophila </it>Dscam is an axon guidance receptor exhibiting extraordinary molecular diversity</p>
            </title>
            <aug>
               <au>
                  <snm>Schmucker</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Clemens</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Shu</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Worby</snm>
                  <fnm>CA</fnm>
               </au>
               <au>
                  <snm>Xiao</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Muda</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Dixon</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Zipursky</snm>
                  <fnm>SL</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>2000</pubdate>
            <volume>101</volume>
            <fpage>671</fpage>
            <lpage>684</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0092-8674(00)80878-8</pubid>
                  <pubid idtype="pmpid" link="fulltext">10892653</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>Evolution by Gene Duplication</p>
            </title>
            <aug>
               <au>
                  <snm>Ohno</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <publisher>Springer Verlag, Berlin, Germany</publisher>
            <pubdate>1970</pubdate>
         </bibl>
         <bibl id="B17">
            <title>
               <p>Structure and organization of the mitochondrial genome of the unicellular red alga <it>Cyanidioschyzon merolae </it>deduced from the complete nucleotide sequence</p>
            </title>
            <aug>
               <au>
                  <snm>Ohta</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Sato</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Kuroiwa</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1998</pubdate>
            <volume>26</volume>
            <fpage>5190</fpage>
            <lpage>5298</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">147977</pubid>
                  <pubid idtype="pmpid" link="fulltext">9801318</pubid>
                  <pubid idtype="doi">10.1093/nar/26.22.5190</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>Complete sequence and analysis of the plastid genome of the unicellular red alga <it>Cyanidioschyzon merolae</it></p>
            </title>
            <aug>
               <au>
                  <snm>Ohta</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Matsuzaki</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Misumi</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Miyagishima</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Nozaki</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Tanaka</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Shin-i</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Kohara</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Kuroiwa</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>DNA Res</source>
            <pubdate>2003</pubdate>
            <volume>10</volume>
            <fpage>67</fpage>
            <lpage>77</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/dnares/10.2.67</pubid>
                  <pubid idtype="pmpid" link="fulltext">12755171</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Histone messengers and histone genes</p>
            </title>
            <aug>
               <au>
                  <snm>Kedes</snm>
                  <fnm>L</fnm>
               </au>
            </aug>
            <source>Ann Rev Biochem</source>
            <pubdate>1979</pubdate>
            <volume>28</volume>
            <fpage>837</fpage>
            <lpage>870</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1146/annurev.bi.48.070179.004201</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>Molecular evolution of the nontandemly repeated genes of the histone 3</p>
            </title>
            <aug>
               <au>
                  <snm>Rooney</snm>
                  <fnm>AP</fnm>
               </au>
               <au>
                  <snm>Piontkivska</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Nei</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2002</pubdate>
            <volume>19</volume>
            <fpage>68</fpage>
            <lpage>75</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11752191</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>Telomere structure, function and maintenance in <it>Arabidopsis</it></p>
            </title>
            <aug>
               <au>
                  <snm>Riha</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Shippen</snm>
                  <fnm>DE</fnm>
               </au>
            </aug>
            <source>Chromosome Res</source>
            <pubdate>2003</pubdate>
            <volume>11</volume>
            <fpage>263</fpage>
            <lpage>275</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1023/A:1022892010878</pubid>
                  <pubid idtype="pmpid" link="fulltext">12769293</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Molecular organization of <it>Chlorella vulgaris </it>chromosomes I; presence of telomeric repeats that are conserved in higher plants</p>
            </title>
            <aug>
               <au>
                  <snm>Higashiyama</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Maki</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Yamada</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Mol Gen Genet</source>
            <pubdate>1995</pubdate>
            <volume>246</volume>
            <fpage>29</fpage>
            <lpage>36</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/BF00290130</pubid>
                  <pubid idtype="pmpid">7823910</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B23">
            <title>
               <p>Organization of telomeric and subtelomeric chromatin in the higher plant <it>Nicotiana tabacum</it></p>
            </title>
            <aug>
               <au>
                  <snm>Fajkus</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kovar&#237;k</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Kr&#225;lovics</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Bezd&#277;k</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Mol Gen Genet</source>
            <pubdate>1995</pubdate>
            <volume>247</volume>
            <fpage>633</fpage>
            <lpage>638</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/BF00290355</pubid>
                  <pubid idtype="pmpid">7603443</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>The chromosome ends of <it>Saccharomyces cerevisiae</it></p>
            </title>
            <aug>
               <au>
                  <snm>Louis</snm>
                  <fnm>EJ</fnm>
               </au>
            </aug>
            <source>Yeast</source>
            <pubdate>1995</pubdate>
            <volume>11</volume>
            <fpage>1553</fpage>
            <lpage>1573</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1002/yea.320111604</pubid>
                  <pubid idtype="pmpid">8720065</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>The highly reduced genome of an enslaved algal nucleus</p>
            </title>
            <aug>
               <au>
                  <snm>Douglas</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Zauner</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Fraunholz</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Beaton</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Penny</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Deng</snm>
                  <fnm>LT</fnm>
               </au>
               <au>
                  <snm>Wu</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Reith</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Cavalier-Smith</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Maier</snm>
                  <fnm>UG</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2001</pubdate>
            <volume>410</volume>
            <fpage>1091</fpage>
            <lpage>1096</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/35074092</pubid>
                  <pubid idtype="pmpid" link="fulltext">11323671</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>Complete nucleotide sequence of the chlorarachniophyte nucleomorph: Nature's smallest nucleus</p>
            </title>
            <aug>
               <au>
                  <snm>Gilson</snm>
                  <fnm>PR</fnm>
               </au>
               <au>
                  <snm>Su</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Slamovits</snm>
                  <fnm>CH</fnm>
               </au>
               <au>
                  <snm>Reith</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Keeling</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>McFadden</snm>
                  <fnm>GI</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2006</pubdate>
            <volume>103</volume>
            <fpage>9566</fpage>
            <lpage>9571</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1480447</pubid>
                  <pubid idtype="pmpid" link="fulltext">16760254</pubid>
                  <pubid idtype="doi">10.1073/pnas.0600707103</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>Jam packed genomes &#8211; a preliminary, comparative analysis of nucleomorphs</p>
            </title>
            <aug>
               <au>
                  <snm>Gilson</snm>
                  <fnm>PR</fnm>
               </au>
               <au>
                  <snm>McFadden</snm>
                  <fnm>GI</fnm>
               </au>
            </aug>
            <source>Genetica</source>
            <pubdate>2002</pubdate>
            <volume>115</volume>
            <fpage>13</fpage>
            <lpage>28</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1023/A:1016011812442</pubid>
                  <pubid idtype="pmpid" link="fulltext">12188044</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Transposable elements and the evolution of genome size in eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Kidwell</snm>
                  <fnm>MG</fnm>
               </au>
            </aug>
            <source>Genetica</source>
            <pubdate>2002</pubdate>
            <volume>115</volume>
            <fpage>49</fpage>
            <lpage>63</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1023/A:1016072014259</pubid>
                  <pubid idtype="pmpid" link="fulltext">12188048</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>Mobile elements: drivers of genome evolution</p>
            </title>
            <aug>
               <au>
                  <snm>Kazazian</snm>
                  <fnm>HH</fnm>
                  <suf>Jr</suf>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2004</pubdate>
            <volume>303</volume>
            <fpage>1626</fpage>
            <lpage>1632</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1089670</pubid>
                  <pubid idtype="pmpid" link="fulltext">15016989</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>Whole-genome shotgun assembly and analysis of the genome of <it>Fugu rubripes</it></p>
            </title>
            <aug>
               <au>
                  <snm>Aparicio</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Chapman</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Stupka</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Putnam</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Chia</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Dehal</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Christoffels</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Rash</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Hoon</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Smit</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Gelpke</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Roach</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Oh</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Ho</snm>
                  <fnm>IY</fnm>
               </au>
               <au>
                  <snm>Wong</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Detter</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Verhoef</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Predki</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Tay</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Lucas</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Richardson</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>SF</fnm>
               </au>
               <au>
                  <snm>Clark</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Edwards</snm>
                  <fnm>YJ</fnm>
               </au>
               <au>
                  <snm>Doggett</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Zharkikh</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Tavtigian</snm>
                  <fnm>SV</fnm>
               </au>
               <au>
                  <snm>Pruss</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Barnstead</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Evans</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Baden</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Powell</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Glusman</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Rowen</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Hood</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Tan</snm>
                  <fnm>YH</fnm>
               </au>
               <au>
                  <snm>Elgar</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Hawkins</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Venkatesh</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Rokhsar</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Brenner</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2002</pubdate>
            <volume>297</volume>
            <fpage>1301</fpage>
            <lpage>1310</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1072104</pubid>
                  <pubid idtype="pmpid" link="fulltext">12142439</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>Eukaryotic transposable elements and genome evolution</p>
            </title>
            <aug>
               <au>
                  <snm>Finnegan</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>1989</pubdate>
            <volume>5</volume>
            <fpage>103</fpage>
            <lpage>107</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/0168-9525(89)90039-5</pubid>
                  <pubid idtype="pmpid">2543105</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>Complete genome sequence of the shrimp white spot bacilliform virus</p>
            </title>
            <aug>
               <au>
                  <snm>Yang</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>He</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lin</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Pan</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>X</fnm>
               </au>
            </aug>
            <source>J Virology</source>
            <pubdate>2001</pubdate>
            <volume>75</volume>
            <fpage>11811</fpage>
            <lpage>11820</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">114767</pubid>
                  <pubid idtype="pmpid" link="fulltext">11689662</pubid>
                  <pubid idtype="doi">10.1128/JVI.75.23.11811-11820.2001</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>Carotenoid biosynthesis in the primitive red alga <it>Cyanidioschyzon merolae</it></p>
            </title>
            <aug>
               <au>
                  <snm>Cunningham</snm>
                  <fnm>FX</fnm>
                  <suf>Jr</suf>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Gantt</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>Euk Cell</source>
            <pubdate>2006</pubdate>
            <volume>6</volume>
            <fpage>533</fpage>
            <lpage>545</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1128/EC.00265-06</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B34">
            <title>
               <p>Evolutionary analysis of <it>Arabidopsis</it>, cyanobacterial, and chloroplast genomes reveals plastid phylogeny and thousands of cyanobacterial genes in the nucleus</p>
            </title>
            <aug>
               <au>
                  <snm>Martin</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Rujan</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Richly</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Hansen</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Cornelsen</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Lins</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Leister</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Stoebe</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Hasegawa</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Penny</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2002</pubdate>
            <volume>99</volume>
            <fpage>12246</fpage>
            <lpage>12251</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">129430</pubid>
                  <pubid idtype="pmpid" link="fulltext">12218172</pubid>
                  <pubid idtype="doi">10.1073/pnas.182432999</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>Phylogeny of plastids based on cladistic analysis of gene loss inferred from complete plastid genome sequences</p>
            </title>
            <aug>
               <au>
                  <snm>Nozaki</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Ohta</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Matsuzaki</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Misumi</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Kuroiwa</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>J Mol Evol</source>
            <pubdate>2003</pubdate>
            <volume>57</volume>
            <fpage>377</fpage>
            <lpage>382</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/s00239-003-2486-6</pubid>
                  <pubid idtype="pmpid" link="fulltext">14708571</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B36">
            <title>
               <p>Genome Analysis. Comparative genomics of two closely related unicellular thermo-acidophilic red algae, <it>Galdieria sulphuraria </it>and <it>Cyanidioschyzon merolae</it>, reveals the molecular basis of the metabolic flexibility of <it>Galdieria </it>and significant differences in carbohydrate metabolism of both algae</p>
            </title>
            <aug>
               <au>
                  <snm>Barbier</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Oesterhelt</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Larson</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Halgren</snm>
                  <fnm>RG</fnm>
               </au>
               <au>
                  <snm>Wilkerson</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Garavito</snm>
                  <fnm>RM</fnm>
               </au>
               <au>
                  <snm>Benning</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Weber</snm>
                  <fnm>APM</fnm>
               </au>
            </aug>
            <source>Plant Physiol</source>
            <pubdate>2005</pubdate>
            <volume>137</volume>
            <fpage>460</fpage>
            <lpage>474</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1065348</pubid>
                  <pubid idtype="pmpid" link="fulltext">15710685</pubid>
                  <pubid idtype="doi">10.1104/pp.104.051169</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B37">
            <title>
               <p>Mitochondrial nuclei</p>
            </title>
            <aug>
               <au>
                  <snm>Kuroiwa</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Int Rev Cytol</source>
            <pubdate>1982</pubdate>
            <volume>75</volume>
            <fpage>1</fpage>
            <lpage>59</lpage>
            <xrefbib>
               <pubid idtype="pmpid">6179895</pubid>
            </xrefbib>
         </bibl>
      </refgrp>
   </bm>
</art>
