<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>1471-2164-8-81</ui>
   <ji>1471-2164</ji>
   <fm>
      <dochead>Methodology article</dochead>
      <bibl>
         <title>
            <p>Spotted cotton oligonucleotide microarrays for gene expression analysis</p>
         </title>
         <aug>
            <au id="A1" ca="yes">
               <snm>Udall</snm>
               <mi>A</mi>
               <fnm>Joshua</fnm>
               <insr iid="I1"/>
               <email>jaudall@byu.edu</email>
            </au>
            <au id="A2">
               <snm>Flagel</snm>
               <mi>E</mi>
               <fnm>Lex</fnm>
               <insr iid="I2"/>
               <email>flagel@iastate.edu</email>
            </au>
            <au id="A3">
               <snm>Cheung</snm>
               <fnm>Foo</fnm>
               <insr iid="I3"/>
               <email>fcheung@tigr.org</email>
            </au>
            <au id="A4">
               <snm>Woodward</snm>
               <mi>W</mi>
               <fnm>Andrew</fnm>
               <insr iid="I4"/>
               <email>woodward@mail.utexas.edu</email>
            </au>
            <au id="A5">
               <snm>Hovav</snm>
               <fnm>Ran</fnm>
               <insr iid="I2"/>
               <email>ran@iastate.edu</email>
            </au>
            <au id="A6">
               <snm>Rapp</snm>
               <mi>A</mi>
               <fnm>Ryan</fnm>
               <insr iid="I2"/>
               <email>rrapp@iastate.edu</email>
            </au>
            <au id="A7">
               <snm>Swanson</snm>
               <mi>M</mi>
               <fnm>Jordan</fnm>
               <insr iid="I2"/>
               <email>swansonj@email.arizona.edu</email>
            </au>
            <au id="A8">
               <snm>Lee</snm>
               <mi>J</mi>
               <fnm>Jinsuk</fnm>
               <insr iid="I4"/>
               <email>jenny-lee@mail.utexas.edu</email>
            </au>
            <au id="A9">
               <snm>Gingle</snm>
               <mi>R</mi>
               <fnm>Alan</fnm>
               <insr iid="I5"/>
               <email>agingle@uga.edu</email>
            </au>
            <au id="A10">
               <snm>Nettleton</snm>
               <fnm>Dan</fnm>
               <insr iid="I6"/>
               <email>dnett@iastate.edu</email>
            </au>
            <au id="A11">
               <snm>Town</snm>
               <mi>D</mi>
               <fnm>Christopher</fnm>
               <insr iid="I3"/>
               <email>cdtown@tigr.org</email>
            </au>
            <au id="A12">
               <snm>Chen</snm>
               <fnm>Z Jeffrey</fnm>
               <insr iid="I4"/>
               <email>zjchen@mail.utexas.edu</email>
            </au>
            <au id="A13">
               <snm>Wendel</snm>
               <mi>F</mi>
               <fnm>Jonathan</fnm>
               <insr iid="I2"/>
               <email>jfw@iastate.edu</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Department of Plant and Animal Sciences, Brigham Young University, Provo, UT, 84062, USA</p>
            </ins>
            <ins id="I2">
               <p>Department of Ecology, Evolution, and Organismal Biology, Iowa State University, Ames, IA, 50011, USA</p>
            </ins>
            <ins id="I3">
               <p>The Institute for Genomic Research, A Division of the J. Craig Venter Institute, 9712 Medical Center Drive, Rockville, MD, 20850, USA</p>
            </ins>
            <ins id="I4">
               <p>Section of Molecular Cell and Developmental Biology and Institute for Cellular and Molecular Biology, University of Texas, Austin, TX, 78712, USA</p>
            </ins>
            <ins id="I5">
               <p>Center for Applied Genetic Technologies, University of Georgia, Athens, Georgia, 30602, USA</p>
            </ins>
            <ins id="I6">
               <p>Department of Statistics, Iowa State University, Ames, IA, 50011, USA</p>
            </ins>
         </insg>
         <source>BMC Genomics</source>
         <issn>1471-2164</issn>
         <pubdate>2007</pubdate>
         <volume>8</volume>
         <issue>1</issue>
         <fpage>81</fpage>
         <url>http://www.biomedcentral.com/1471-2164/8/81</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">17389046</pubid>
               <pubid idtype="doi">10.1186/1471-2164-8-81</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>24</day>
               <month>10</month>
               <year>2006</year>
            </date>
         </rec>
         <acc>
            <date>
               <day>27</day>
               <month>3</month>
               <year>2007</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>27</day>
               <month>3</month>
               <year>2007</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2007</year>
         <collab>Udall et al; licensee BioMed Central Ltd.</collab>
         <note>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>Microarrays offer a powerful tool for diverse applications in plant biology and crop improvement. Recently, two comprehensive assemblies of cotton ESTs were constructed based on three <it>Gossypium </it>species. Using these assemblies as templates, we describe the design and creation of a publicly available oligonucleotide array for cotton, useful for all four of the cultivated species.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>Synthetic oligonucleotide probes were generated from exemplar sequences of a global assembly of 211,397 cotton ESTs derived from >50 different cDNA libraries representing many different tissue types and tissue treatments. A total of 22,787 oligonucleotide probes are included on the arrays, optimized to target the diversity of the transcriptome and previously studied cotton genes, transcription factors, and genes with homology to <it>Arabidopsis</it>. A small portion of the oligonucleotides target unidentified protein coding sequences, thereby providing an element of gene discovery. Because many oligonucleotides were based on ESTs from fiber-specific cDNA libraries, the microarray has direct application for analysis of the fiber transcriptome. To illustrate the utility of the microarray, we hybridized labeled bud and leaf cDNAs from <it>G. hirsutum </it>and demonstrate technical consistency of results.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>The cotton oligonucleotide microarray provides a reproducible platform for transcription profiling in cotton, and is made publicly available through <url>http://cottonevolution.info</url>.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p><it>Gossypium </it>contains nine different genome groups comprising approximately 50 species whose phylogenetic relationships have been well-studied <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. The A-, D-, and AD-genome groups have received special attention, as four different species [<it>Gossypium herbaceum </it>(A1), <it>Gossypium arboreum </it>(A2), <it>Gossypium hirsutum </it>(AD1) and <it>Gossypium barbadense </it>(AD2)] have been domesticated for their abundant seed trichomes. These species collectively provide the foundation for the textile industry worldwide, with most cotton today deriving from <it>G. hirsutum</it>, or upland cotton. Relationships among genome groups have been quantified in several studies, and the closest living relatives of the diploid genome donors to allopolyploid cotton have been identified <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr></abbrgrp>. The diploid donor of the allopolyploid A<sub>T </sub>genome [where the T subscript indicates the A genome in the tetraploid (AD) nucleus], was a species much like modern <it>G. arboreum </it>or <it>G. herbaceum</it>, whereas the allopolyploid D<sub>T </sub>genome is derived from a progenitor similar to modern <it>G. raimondii</it>. These well-established relationships provide a phylogenetic framework to investigate the evolution of gene expression both in terms of domesticated fiber production and polyploidy.</p>
         <p>Microarrays are a powerful method to simultaneously measure relative expression levels for thousands of genes and they may be composed of cDNA inserts, short oligonucleotides, or long oligonucleotides. The advantages and disadvantages of each of these probe types have been extensively reviewed <abbrgrp><abbr bid="B6">6</abbr><abbr bid="B7">7</abbr><abbr bid="B8">8</abbr></abbrgrp>. We chose to create a long oligonucleotide microarray for cotton because of its low manufacturing cost, flexibility in design, homogeneous melting temperatures (T<sub>m</sub>), and relative ease of adding probes. A small EST assembly (~45,000 ESTs) was previously used to generate oligonucleotide probes for cotton fiber <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>. A larger scale EST assembly (> 150,000 ESTs) was recently produced as a community-wide effort by cotton researchers <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>. Subsequent additions of cotton ESTs to Genbank (> 210,000 ESTs) have been compiled into a large EST assembly [TIGR Cotton Gene Index 8, (CGI8)] <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>. These two assemblies constitute nearly all of the known genic sequence from cotton. Similar large-scale EST assemblies have been successfully used to design oligonucleotide microarrays for functional genomics investigations in model plants (<it>e.g. Arabidopsis</it><abbrgrp><abbr bid="B12">12</abbr></abbrgrp> and rice<abbrgrp><abbr bid="B13">13</abbr></abbrgrp>) and non-model plants (<it>e.g</it>. maize<abbrgrp><abbr bid="B14">14</abbr></abbrgrp> and tomato<abbrgrp><abbr bid="B15">15</abbr></abbrgrp>).</p>
         <p>Here we describe the design and creation of a publicly available oligonucleotide microarray for cotton. Synthetic oligonucleotide probes were generated from the sequences of two different assemblies of cotton ESTs representing more than 50 different cDNA libraries and many different tissue types and tissue treatments <abbrgrp><abbr bid="B10">10</abbr><abbr bid="B11">11</abbr></abbrgrp>. To illustrate their utility on printed microarray slides, we hybridized labeled bud and leaf cDNAs from <it>G. hirsutum</it>, and demonstrate technical consistency of results. As many of these EST sequences were derived from a fiber-specific cDNA library, this array also has direct application for analysis of the fiber transcriptome.</p>
      </sec>
      <sec>
         <st>
            <p>Results and discussion</p>
         </st>
         <sec>
            <st>
               <p>Microarray design</p>
            </st>
            <p>We created an oligonucleotide microarray for cotton using fiber genes in Genbank, a reported EST assembly of >150,000 ESTs <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>, and a recent assembly of >210,000 ESTs <abbrgrp><abbr bid="B11">11</abbr></abbrgrp> as templates for probe design. From these sequences, we designed three sets of oligonucleotide probes (1,154, 12,006, and 9,629, respectively) and included all three sets (22,787 total oligonucleotides) on a single, publicly available microarray <abbrgrp><abbr bid="B16">16</abbr></abbrgrp>. The first set of 1,154 oligonucleotide probes was designed from cotton ESTs with homology to <it>Arabidopsis </it>genes with roles as regulators of chromatin, transcription, cell wall biosynthesis, and cell cycle <abbrgrp><abbr bid="B17">17</abbr></abbrgrp>.</p>
            <p>The second set of oligonucleotide probes was designed from an exemplar sequence set <abbrgrp><abbr bid="B10">10</abbr></abbrgrp> using Picky v1.0 <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>. An exemplar sequence refers to an example gene (<it>i.e</it>., the longest) chosen from a clustered set of unigenes by single-linkage clustering with BLASTN <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>. Picky prioritized the unique sequence of the identified oligonucleotide probes while maintaining a uniform probe-target melting temperature. 12,006 oligonucleotides (66 bp average length; 3.5 s.d.) with a relatively small range of melting temperatures (T<sub>m</sub>, 78.33 &#177; 1.40 s.d.) were selected from a large list of candidate probes. This list of targeted genes includes genes requested by members of the cotton research community, a large number of transcription factors, and several thousand genes that had homology to <it>Arabidopsis </it>genes (Table <tblr tid="T1">1</tblr>) [see Additional file <supplr sid="S1">1</supplr>].</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Oligonucleotide probes were designed separately from three different sets of ESTs.</p>
               </caption>
               <tblbdy cols="5">
                  <r>
                     <c ca="left">
                        <p>Types of probes</p>
                     </c>
                     <c ca="left">
                        <p>1<sup>st </sup>oligo set<sup>1</sup></p>
                     </c>
                     <c ca="left">
                        <p>2<sup>nd </sup>oligo set<sup>2</sup></p>
                     </c>
                     <c ca="left">
                        <p>3<sup>rd </sup>oligo set<sup>3</sup></p>
                     </c>
                     <c ca="left">
                        <p>Totals<sup>4</sup></p>
                     </c>
                  </r>
                  <r>
                     <c cspan="5">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p><it>Arabidopsis </it>matches<sup>5</sup></p>
                     </c>
                     <c ca="left">
                        <p>866</p>
                     </c>
                     <c ca="left">
                        <p>7,419</p>
                     </c>
                     <c ca="left">
                        <p>4,031</p>
                     </c>
                     <c ca="left">
                        <p>12,316</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Singletons</p>
                     </c>
                     <c ca="left">
                        <p>na</p>
                     </c>
                     <c ca="left">
                        <p>5,280</p>
                     </c>
                     <c ca="left">
                        <p>3,852</p>
                     </c>
                     <c ca="left">
                        <p>9,132</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Transcription factors (TF)<sup>6</sup></p>
                     </c>
                     <c ca="left">
                        <p>230</p>
                     </c>
                     <c ca="left">
                        <p>2,223</p>
                     </c>
                     <c ca="left">
                        <p>677</p>
                     </c>
                     <c ca="left">
                        <p>3,130</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>GO Biological Process<sup>7</sup></p>
                     </c>
                     <c ca="left">
                        <p>46</p>
                     </c>
                     <c ca="left">
                        <p>464</p>
                     </c>
                     <c ca="left">
                        <p>126</p>
                     </c>
                     <c ca="left">
                        <p>636</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>GO Molecular Function<sup>8</sup></p>
                     </c>
                     <c ca="left">
                        <p>184</p>
                     </c>
                     <c ca="left">
                        <p>1,759</p>
                     </c>
                     <c ca="left">
                        <p>551</p>
                     </c>
                     <c ca="left">
                        <p>2,494</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>PFAM<sup>9</sup></p>
                     </c>
                     <c ca="left">
                        <p>na</p>
                     </c>
                     <c ca="left">
                        <p>471</p>
                     </c>
                     <c ca="left">
                        <p>na</p>
                     </c>
                     <c ca="left">
                        <p>471</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="5">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total number of oligos</p>
                     </c>
                     <c ca="left">
                        <p>1,154</p>
                     </c>
                     <c ca="left">
                        <p>12,006</p>
                     </c>
                     <c ca="left">
                        <p>9,629</p>
                     </c>
                     <c ca="left">
                        <p>22,789</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p><sup>1</sup>Oligonucleotides (oligos) were designed at Texas A&amp;M University in the former lab of Dr. Chen [17]. <sup>2</sup>Oligos designed at Iowa State University from a global assembly of ESTs [10]. <sup>3</sup>Oligos designed by The Institute for Genomic Research (TIGR) from the Cotton Gene Index 8 [11]. <sup>4</sup>Column totals are close approximations since each oligo set was designed separately. <sup>5</sup><it>Arabidopsis </it>matches are based on oligo WUBLASTX hits to the TAIR <it>Arabidopsis </it>protein dataset and parsed for 50 aa length and 50% percent identity. <sup>6</sup>Transcription factor sub-total may be an over-estimate as Biological Processes and Molecular Function are not mutually exclusive categories. <sup>7</sup>Biological Process = transcription. <sup>8</sup>Molecular Function = nucleic acid binding activity, nucleotide binding activity, RNA and DNA binding activity, and transcription factor activity. <sup>9</sup>Putative PFAM TF identified in the 2<sup>nd </sup>oligo set were in addition to those annotated by gene ontology.</p>
               </tblfn>
            </tbl>
            <suppl id="S1">
               <title>
                  <p>Additional file 1</p>
               </title>
               <text>
                  <p><b>Composition of the cotton oligonucleotide microarray</b>. 22,789 oligonucleotides were designed from three separate sets of genic sequences from cotton (See Table <tblr tid="T1">1</tblr>). The grey boxes represent the total number of probes in each set. The hatched boxes indicate the number of probes with a putative <it>Arabidopsis </it>hit. The black boxes indicate the number of probes designed from singletons from their respective assemblies. The remaining boxes with dotted squares indicate the number of probes targeting transcription factors.</p>
               </text>
               <file name="1471-2164-8-81-S1.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>The third set of oligonucleotide probes was designed from CGI8 <abbrgrp><abbr bid="B11">11</abbr></abbrgrp> that contained 55,673 unique sequences using Picky v2.0. Where possible, identical Picky parameters were used to design the 3<sup>rd </sup>oligonucleotide set as the 2<sup>nd </sup>set. Probes that targeted the same genes as in the first two probe sets were excluded from further analysis. In total, 9,629 additional oligonucleotide probes were generated (66 bp average length, 3.6 s.d.; 76.82 T<sub>m</sub>, s.d. 1.93) and added to the previous 2 probe sets.</p>
            <p>Two essential considerations of microarray quality include the number of targeted genes and the broad utility of the microarray for specific tissues or treatments. Regarding the first consideration, the 22,778 genes described here include perhaps 46&#8211;60% of the total genic diversity, given that the total number of genes in the cotton genome may be approximately 40,000&#8211;50,000 <abbrgrp><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr></abbrgrp>. Indeed, 44% and 40% of the oligonucleotides were designed from singletons from the first <abbrgrp><abbr bid="B10">10</abbr></abbrgrp> and second <abbrgrp><abbr bid="B11">11</abbr></abbrgrp> assemblies, respectively. However, some probes were not completely target-specific, perhaps due to imperfect EST assemblies and due to separate sets of probes designed from different assemblies. Approximately 1,800 potential non-specific homologies were identified in the recent Gene Index of 55,673 unigenes <abbrgrp><abbr bid="B11">11</abbr></abbrgrp> using vmatch <abbrgrp><abbr bid="B21">21</abbr></abbrgrp> with a ~95% sequence percent identity threshold. Nevertheless, most of the oligonucleotides had a single target, as designed [see Additional file <supplr sid="S2">2</supplr>].</p>
            <suppl id="S2">
               <title>
                  <p>Additional file 2</p>
               </title>
               <text>
                  <p><b>Distribution of the number of matches of oligonucleotide probes to the Cotton Gene Index 8 (CGI8) assembly</b>. All three sets were queried within the sequences of the CGI8 assembly and only a small number (1,773) of probes target (>93% percent identity) more than one CGI8 unigene indicating a potential cross-hybridization or an 'over-split' assembly for the targeted gene.</p>
               </text>
               <file name="1471-2164-8-81-S2.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>Regarding the second consideration, these microarray probes have a broad utility for specific tissues or treatments. For example, a detailed analysis of the second probe set revealed that ~7,300 probes represented genes expressed in specific tissues or under specific conditions [see Additional file <supplr sid="S3">3</supplr>]. The number of specifically expressed genes was determined by summing the number of contigs mostly composed of ESTs from a single library (90%) and the corresponding singletons. In total, 56% of the 2<sup>nd </sup>oligonucleotide set represent genes from a specific library; however, a large number of those genes (24%) are from the two <it>G. raimondii </it>libraries that were prepared from heterogeneous tissues and which were more deeply sampled than most of the other cotton cDNA libraries. More than 1,000 oligonucleotides appear to target genes found only in a 7&#8211;10 days post-anthesis fiber library <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>, and 733 appear to target transcripts uniquely identified following cycloheximide treatment of ovules <abbrgrp><abbr bid="B22">22</abbr></abbrgrp>. These two considerations suggest that the oligonucleotides selected for the cotton oligonucleotide microarray have a broad diagnostic utility while potentially targeting tissue-specific transcripts expressed under a variety of conditions. The sequences and annotations of all the probes are publicly available via a web-based query <abbrgrp><abbr bid="B16">16</abbr></abbrgrp> or by request.</p>
            <suppl id="S3">
               <title>
                  <p>Additional file 3</p>
               </title>
               <text>
                  <p><b>Many of the oligonucleotides from the 2<sup>nd </sup>set were derived from contigs or singletons representing individual libraries (n = 7,319)</b>. Library totals reflect the contigs (respective library's ESTs > 90%) and singletons used to design the oligonucleotides. The two large <it>G. raimondii </it>libraries created from heterogeneous seedling and whole flower tissue are not illustrated.</p>
               </text>
               <file name="1471-2164-8-81-S3.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
         </sec>
         <sec>
            <st>
               <p>Microarray hybridizations</p>
            </st>
            <p>Many potential sources of error can have a large impact on microarray experiments, such as inconsistency among multiple RNA extractions, reverse transcription, RNA amplification, and labeling, as well as different levels of background noise for each microarray. Many of these sources of error can be resolved by appropriate experimental design <abbrgrp><abbr bid="B23">23</abbr><abbr bid="B24">24</abbr></abbrgrp> and careful laboratory technique; however, the quality of the microarray must often be assumed and often is not under the control of the investigator. We investigated the oligonucleotide performance within the first version of the cotton microarray [Gene Expression Omnibus (GEO) database: GPL4305] containing the 1<sup>st </sup>and 2<sup>nd </sup>replicated spots printed for each probe in these two sets. We found a low level of within-microarray variation, reproducible 'self vs. self' hybridizations with bud tissue, and reproducible expression differences between bud and leaf treatments. The results from the first version of the cotton microarray suggest that the current version with 9,629 additional probes will provide a robust, reproducible platform for transcription profiling in cotton.</p>
            <p>Variation within microarrays between the two replicate features was estimated for each oligonucleotide probe, as a consequence of including two microarray features for each oligonucleotide probe in two separate sections of the microarray. The average log-adjusted difference between two replicated features was 0.03 (s.d. 0.69), 0.02 (s.d. 0.80), and 0.02 (s.d. 0.83) for replications 1, 2, and 3, respectively (Figure <figr fid="F1">1A</figr>). The slightly positive value of the average spot differences suggests that the first pin-touch on the microarray deposited slightly more oligonucleotide probe in a slightly larger spot on the slide than the second pin-touch.</p>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>A reproducible platform for transcription profiling using cotton microarrays</p>
               </caption>
               <text>
                  <p><b>A reproducible platform for transcription profiling using cotton microarrays</b>. A) Differences detected between duplicated spots plotted by their mean expression value from replicate 1 of the experiment. Each plot is hexagonally-binned to uncover the density component that is otherwise saturated by a cloud of data points. The difference of the log-adjusted, median centered duplicate spots is measured on the horizontal axis and the mean value of the same duplicated spots is measured on the vertical (values in grey, scale bars on left vertical axis). Most duplicated spots deviated very little, though genes with lower expression values tended to deviate more. Replication of the three treatment loop design indicated only minor detectable differences between duplicated spots. Nearly identical results were found for the other two replicates. B) Correlation of normalized, log-adjusted fluorescence intensity values for bud (Cy3) &#215; bud' (Cy5) for the first microarray of the first replication. A 45&#176; angle line has been overlaid to illustrate the expected 1:1 ratio of spot intensity. In this case, Cy3 labeled aRNA had higher intensity values on average; however, the effect of dye was removed from the contrast of differential expression in our analysis by including a dye component into our analytical model through dye swaps. C) Correlation of t-test p-values. Gene-specific tests for differential expression between bud and leaf and between bud' and leaf were conducted as described in Materials and Methods. The <it>p</it>-values from the bud' vs. leaf tests are plotted against the <it>p</it>-values from the bud vs. leaf tests on a negative natural log scale. The points in the upper right quadrant of the picture correspond to the genes with the smallest <it>p</it>-values. The points are scattered tightly around the 45 degree line, indicating that <it>p</it>-values for the most significant genes were very similar according to both comparisons.</p>
               </text>
               <graphic file="1471-2164-8-81-1"/>
            </fig>
            <p>We also demonstrated the reproducibility of the microarray by quantifying the amount of variation for these newly constructed cotton microarrays between two identical pooled 'treatments' of bud RNA (bud and bud'). On the individual microarrays, there was a high degree of correlation between the Cy3-labeled bud RNA and the Cy5-labeled bud RNA (<it>r </it>= 0.92; data not shown). When searching for expression differences between bud and bud' RNA pools, no differences were detected at a relatively liberal false discovery rate of 20% (Table <tblr tid="T2">2</tblr>).</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Number of differentially expressed genes at different levels of false discovery [34].</p>
               </caption>
               <tblbdy cols="7">
                  <r>
                     <c ca="left">
                        <p>Comparison</p>
                     </c>
                     <c ca="center">
                        <p>0.001</p>
                     </c>
                     <c ca="center">
                        <p>0.010</p>
                     </c>
                     <c ca="center">
                        <p>0.050</p>
                     </c>
                     <c ca="center">
                        <p>0.100</p>
                     </c>
                     <c ca="center">
                        <p>0.200</p>
                     </c>
                     <c ca="center">
                        <p>0.300</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>bud &#8211; bud'</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>20</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>bud &#8211; leaf</p>
                     </c>
                     <c ca="center">
                        <p>2,167</p>
                     </c>
                     <c ca="center">
                        <p>4,506</p>
                     </c>
                     <c ca="center">
                        <p>6,562</p>
                     </c>
                     <c ca="center">
                        <p>7,600</p>
                     </c>
                     <c ca="center">
                        <p>8,933</p>
                     </c>
                     <c ca="center">
                        <p>9,694</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>bud' &#8211; leaf</p>
                     </c>
                     <c ca="center">
                        <p>2,232</p>
                     </c>
                     <c ca="center">
                        <p>4,608</p>
                     </c>
                     <c ca="center">
                        <p>6,506</p>
                     </c>
                     <c ca="center">
                        <p>7,641</p>
                     </c>
                     <c ca="center">
                        <p>9,007</p>
                     </c>
                     <c ca="center">
                        <p>9,654</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <p>Finally, if we test for expression differences between the leaf RNA pool and each of the bud RNA pools (bud and bud'), many genes were found to be consistently differentially expressed between bud vs. leaf and bud' vs. leaf, as seen by the high correlation among the most significant p-values (Figure <figr fid="F1">1C</figr>). If our goal was to describe differentially expressed genes between leaf and bud, we would have a large list of putatively differentially expressed genes (Table <tblr tid="T2">2</tblr>); however, in this particular case, we can only claim that these genes were differentially expressed between the two amplified RNA samples considered in our experiment. We intentionally did not include biological replicates because our interest was in quantifying technical variation. Biological replication would be necessary to conclude that the expression differences are inherent differences between leaf and bud rather than simply differences between the particular leaf RNA pool and the particular bud and bud' RNA pools prepared for this experiment.</p>
            <p>Because a global assembly of ESTs was used to design this first version of the microarray, genes expressed in many tissues of the plants, including cotton fibers, are represented. A total of 1,864 genes were found to be differentially expressed between our leaf RNA pool and our bud RNA pools (false discovery rate = 0.001; Figure <figr fid="F1">1C</figr>). (Again note that these are differences between our RNA pools rather than inherent expression differences between general leaf and bud tissues.) Of these differences, slightly less than 10% belonged to a set of probes that had no BLASTX hit (&lt; 1 &#215; 10<sup>-20</sup>) and were designed solely based on an ESTScan prediction, thereby providing an element of functional gene discovery to the microarray. Of the 1,864 hypothetical genes that were differentially expressed, 602 were identified by probes derived from cotton fiber cDNA libraries (<abbrgrp><abbr bid="B9">9</abbr></abbrgrp>; Ben Burr, unpublished data; Candace Haigler, unpublished data). This number did not include probes designed for known cotton genes, nor other genes that were removed from the analysis (low expressed fiber genes that may not be detected in leaf or bud aRNA) that may also represent genes specifically expressed in fiber tissue.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>Here we provide a detailed report of the design of long-oligonucleotide microarrays for cotton and illustrate their technical performance. Proper design of microarray experiments for discovery of gene expression profiles requires biological replication <abbrgrp><abbr bid="B24">24</abbr><abbr bid="B25">25</abbr><abbr bid="B26">26</abbr></abbrgrp>. Because our goal was not to discover nor report novel gene expression profiles in leaves or buds, we restricted our replications to pools of technical replicates in this experiment. These cotton microarrays are publicly available <abbrgrp><abbr bid="B16">16</abbr></abbrgrp>, and may continue to be augmented with additional oligonucleotides designed from subsequent EST assemblies. As a tool for functional genomics, the future use of these microarrays may uncover clues to the transcriptional regulation of cotton fiber and other tissues in properly replicated experimental designs.</p>
      </sec>
      <sec>
         <st>
            <p>Methods</p>
         </st>
         <sec>
            <st>
               <p>Microarray probe selection</p>
            </st>
            <p>A total of 22,787 probes were printed on the cotton oligonucleotide microarray, composed of 12,006 oligonucleotides selected from recently reported contigs and singletons derived from a global assembly of cotton ESTs <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>, and 9,629 designed against the latest TIGR cotton transcript assembly (CGI8). We also included 1,154 oligonucleotides designed in the Z. J. Chen laboratory based on previously available sequence data <abbrgrp><abbr bid="B27">27</abbr></abbrgrp>.</p>
            <p>Similar probe design strategies were used for all three sets of probes. Lee et al. <abbrgrp><abbr bid="B17">17</abbr></abbrgrp> provided a description of the design of the first set of oligonucleotides. The second and third sets of oligonucleotides were designed from the EST exemplar sequences <abbrgrp><abbr bid="B10">10</abbr></abbrgrp> and the TIGR Gene Index <abbrgrp><abbr bid="B11">11</abbr></abbrgrp> with Picky (v 1.0) <abbrgrp><abbr bid="B18">18</abbr></abbrgrp> and Picky (v 2.0), respectively. Only EST sequences with a predicted protein from ESTScan <abbrgrp><abbr bid="B28">28</abbr></abbrgrp> or a high protein homology (70% identity) to an <it>Arabidopsis </it>gene were considered candidates for oligonucleotide selection.</p>
            <p>Three different criteria were invoked in the iterative selection of the microarray probes from the EST assemblies: (1) candidate probes identified by Picky by their unique sequences, complexity, and T<sub>m</sub>; (2) characterized cotton mRNAs in GenBank and genes of special interest to the cotton community; and (3) complementation to previously synthesized probe set(s). Thus, for each oligonucleotide set, candidate long-oligonucleotide probes (60 &#8211; 70 mers) were separately generated based on criteria 1 and 2, then a final list of probes was selected for oligonucleotide synthesis by cross-checking the new list of probes with previously synthesized oligonucleotides.</p>
            <p>For design of both the second and third probe sets, we solicited input from the cotton community to identify genes of interest for microarray probe design. Most requests were for known cotton genes with sequences in GenBank, in addition to candidate genes identified in our EST assembly by high homology to genes characterized in other organisms. Probes for these genes were designed with the sequences from the EST assemblies as 'background' to identify the most unique probes possible.</p>
            <p>Both transcription factors and genes with little or no annotation were represented on the cotton microarray. Based on widespread interest in transcription factor expression levels, we selected probes targeting genes that had either a transcription related GO ontology <abbrgrp><abbr bid="B29">29</abbr></abbrgrp>, or a transcription factor domain as predicted by PFAM <abbrgrp><abbr bid="B30">30</abbr></abbrgrp> (Table <tblr tid="T1">1</tblr>). Genes with little or no annotation represent a gene discovery component to future microarray experiments. When genes targeted by the 2<sup>nd </sup>probe set were compared to the <it>Arabidopsis </it>TAIR protein dataset, 1,200 of them did not have a significant BLASTX hit (&lt; 1e-20) but they did have a coding frame as predicted by ESTScan <abbrgrp><abbr bid="B28">28</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Oligonucleotide synthesis and microarray printing</p>
            </st>
            <p>Each set of oligonucleotides was synthesized and aliquoted into 3 replicate plates by IDT Technologies (Coralville, IA, USA). An aliquot of 384-well plates from all three sets of oligonucleotides was hydrated in water then diluted to the printing concentration with 3&#215; SSC. Positive and negative controls were included on the printed microarrays. To assess microarray quality, two spots of each oligo from the same pin-dip were printed in separate slide sections on Corning epoxy slides at the Washington University Microarray Core facility using a locally constructed linear servo arrayer (after the DeRisi model <abbrgrp><abbr bid="B31">31</abbr></abbrgrp>) creating the first version of the cotton oligonucleotide microarray [GEO: GPL4305]. After printing, slides were allowed to dry in 50&#8211;70% humidity for 12&#8211;16 hrs (~25&#176;C) and cross-linked at 150 mJoules. Two slides from the print batch were checked using SpotCheck (Genetix). Printed cotton microarrays, and images of each print batch are publicly available <abbrgrp><abbr bid="B16">16</abbr></abbrgrp>. Experiments using the preliminary platform [GEO: GPL4305] or this new platform [GEO: GPL4808] can be found at GEO <abbrgrp><abbr bid="B32">32</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>RNA extraction</p>
            </st>
            <p>One leaf and one bud (10 &#8211; 14 days before anthesis) tissue sample of <it>G. hirsutum </it>cv. Acala Maxxa were collected from three separate replications of 4 &#8211; 8 plants grown in the Horticulture Greenhouse at Iowa State University under supplemental lighting (16 hr. days). RNA was extracted from each of the six samples using a modified hot-borate method <abbrgrp><abbr bid="B33">33</abbr></abbrgrp>, quantified, and checked for integrity using a Bioanalyzer (Agilent, Inc., Palo Alto, CA, USA). Equimolar amounts of RNA (A<sub>260</sub>) from three separate extractions were pooled into a single leaf and single bud sample, respectively.</p>
         </sec>
         <sec>
            <st>
               <p>RNA amplification and labeling</p>
            </st>
            <p>An indirect labeling procedure of amplified aminoallyl-aRNA (TargetAmp&#8482;, Epicentre Biotechnologies, Madison, WI, USA) was used for one leaf RNA sample and one bud RNA sample. 0.5 ug of total RNA was used as starting material for 1 round of aRNA amplification, resulting in 26 ug and 51 ug of aRNA from leaves and buds, respectively.</p>
            <p>Cy3 and Cy5 dyes (Amersham Biosciences, Pittsburgh, PA, USA) were coupled to two aliquots of 13 and 16 ug of both aRNA samples, respectively. The Cy3- and Cy5-labeled aRNA probes were purified using the Qiagen RNeasy Mini kit (Qiagen, Germantown, MD, USA), and sufficient incorporation of Cy3 (550 nm) and Cy5 (650 nm) dyes was verified.</p>
         </sec>
         <sec>
            <st>
               <p>Microarray hybridization and image analysis</p>
            </st>
            <p>For microarray hybridization, 300 ng of Cy3 and Cy5 labeled aRNA was used per each slide using the Pronto!&#8482; Plus system protocol (Promega Corporation, Madison WI, USA) with minor changes as described below. Slides from each rep (3) were immersed in 200 ml of Pronto Universal Pre-Soak solution containing 2 ml of liquid Sodium Borohydride for 20 min at 42&#176;C. Slides were transferred to fresh containers with Wash Solution 2 at room temperature for 2 min and then immersed in 200 ml of hybridization buffer (5 &#215; SSC; 0.1 &#215; SDS; BSA 0.1 mg/ml). Slides then were incubated with a fresh Wash Solution 2 at room temperature for 2 min, and were washed 2 additional times with Wash Solution 3 at room temperature for 2 min each. Following immersion in nuclease-free water, slides were dried by centrifugation at 1,600 g for 3 min. All hybridizations and post-hybridization washes were performed exactly as described in the Pronto!&#8482; Plus system protocol.</p>
            <p>Microarray images were captured using an arrayWoRx<sup>&#174; </sup>Biochip Reader (Applied Precision, Issaquah, WA, USA) using an exposure of 0.5 sec for each channel (Cy5 and Cy3) at ~10 um resolution. GenePix<sup>&#174; </sup>Pro (v 5.1, Molecular Devices, Sunnyvale, CA, USA) was used to extract the background-adjusted intensity of each spot. Features that were 'absent', 'not-found', or that had a negative intensity after background adjustment were excluded from the analysis. Data files from this experiment can be found in GEO data set [GSE5875].</p>
         </sec>
         <sec>
            <st>
               <p>Experimental design and statistical analysis</p>
            </st>
            <p>Three replications of a three treatment loop design (bud &#8594; leaf, leaf &#8594; bud', and bud' &#8594; bud) were hybridized on nine microarrays, where bud and bud' simply represent different aliquots of the same aRNA. The signal intensity data were natural log transformed and median normalized, and the 9,654 genes with complete data were examined for expression differences among the three sample types (leaf, bud, and bud'). We considered a standard mixed linear model for the data from any single gene given by</p>
            <p><it>y</it><sub><it>ijk </it></sub>= <it>&#956; </it>+ <it>&#948;</it><sub><it>i </it></sub>+ <it>&#964;</it><sub><it>j </it></sub>+ <it>s</it><sub><it>k </it></sub>+ <it>e</it><sub><it>ijk</it></sub>,</p>
            <p>where <it>y</it><sub><it>ijk </it></sub>denotes the normalized log-scale signal intensity (averaged over duplicate spots) for dye <it>i</it>, sample type <it>j</it>, and slide <it>k</it>; <it>&#956; </it>denotes an intercept parameter; <it>&#948;</it><sub><it>i </it></sub>denotes the effect of dye <it>i</it>; <it>&#964;</it><sub><it>j </it></sub>denotes the effect of sample type <it>j</it>; <it>s</it><sub><it>k </it></sub>denotes the random effect of slide <it>k</it>; and <it>e</it><sub><it>ijk </it></sub>denotes a random error term that is intended to capture all other sources of variability. (Note that although we considered a separate model for each gene, we have suppressed a gene subscript on each term to simplify notation.) Here <it>i </it>= 1, 2 (Cy3 and Cy5); <it>j </it>= 1, 2, 3 (bud, bud', and leaf); and <it>k </it>= 1, ..., 9 (microarray slides 1 &#8211; 9). On the basis of this model, <it>t</it>-tests for differential expression between each pair of sample types (leaf vs. bud, leaf vs. bud', and bud vs. bud') were conducted. The 9,654 <it>p</it>-values from each of these comparisons were converted to <it>q</it>-values using the method of Storey and Tibshirani <abbrgrp><abbr bid="B34">34</abbr></abbrgrp>. These <it>q</it>-values were used to identify the number of differentially expressed genes for a given comparison when controlling the false discovery rate at various levels.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Abbreviations</p>
         </st>
         <p>ESTs: Expressed sequence tags</p>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>JJW, JJL, and ZJC designed and provided the first set of oligonucleotides. JAU, JMS, JFW, and ZJC designed, analyzed, and provided the second set of oligonucleotides. FC, AWW, CDT, and ZJC designed and provided the final set of oligonucleotides. LF and JAU grew the plants and extracted RNA. RH, LF, and RAR amplified, labeled, and performed the microarray hybridizations. DN provided the statistical model and analytical framework. LF, JAU, and DN analyzed and interpreted the data. ARG customized an internet accessible MIAME-compliant Stanford Microarray Database for these arrays and created a GEO microarray platform for this and future experiment submissions. JAU, RAR, and JFW conceived the experiment. JAU and JFW drafted the manuscript. All authors have read and approved the manuscript.</p>
      </sec>
      <sec>
         <st>
            <p>Availability and requirements</p>
         </st>
         <p>Project name: The evolutionary genomics of cotton</p>
         <p>Project home page: <url>http://cottonevolution.info</url></p>
         <p>Operating system: Platform independent</p>
         <p>Programming language: HTML and XML</p>
         <p>License: no license required</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>The work was supported by grants from the National Science Foundation Plant Genome Research Program (DBI0211700 to J.F.W. and DBI0624077 to Z.J.C.).</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Polyploidy and the evolutionary history of cotton</p>
            </title>
            <aug>
               <au>
                  <snm>Wendel</snm>
                  <fnm>JF</fnm>
               </au>
               <au>
                  <snm>Cronn</snm>
                  <fnm>RC</fnm>
               </au>
            </aug>
            <source>Advances in Agronomy</source>
            <pubdate>2003</pubdate>
            <volume>78</volume>
            <fpage>139</fpage>
            <lpage>186</lpage>
         </bibl>
         <bibl id="B2">
            <title>
               <p>Rapid diversification of the cotton genus (Gossypium: Malvaceae) revealed by analysis of sixteen nuclear and chloroplast genes</p>
            </title>
            <aug>
               <au>
                  <snm>Cronn</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>Small</snm>
                  <fnm>RL</fnm>
               </au>
               <au>
                  <snm>Haselkorn</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Wendel</snm>
                  <fnm>JF</fnm>
               </au>
            </aug>
            <source>Am J Bot</source>
            <pubdate>2002</pubdate>
            <volume>89</volume>
            <fpage>707</fpage>
            <lpage>725</lpage>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Rate variation among nuclear genes and the age of polyploidy in <it>Gossypium</it></p>
            </title>
            <aug>
               <au>
                  <snm>Senchina</snm>
                  <fnm>DS</fnm>
               </au>
               <au>
                  <snm>Alvarez</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Cronn</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Rong</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Noyes</snm>
                  <fnm>RD</fnm>
               </au>
               <au>
                  <snm>Paterson</snm>
                  <fnm>AH</fnm>
               </au>
               <au>
                  <snm>Wing</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Wilkins</snm>
                  <fnm>TA</fnm>
               </au>
               <au>
                  <snm>Wendel</snm>
                  <fnm>JF</fnm>
               </au>
            </aug>
            <source>Molecular Biology and Evolution</source>
            <pubdate>2003</pubdate>
            <volume>20</volume>
            <fpage>633</fpage>
            <lpage>643</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1093/molbev/msg065</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <title>
               <p>Genetics, cytology, and evolution of <it>Gossypium</it></p>
            </title>
            <aug>
               <au>
                  <snm>Endrizzi</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Turcotte</snm>
                  <fnm>EL</fnm>
               </au>
               <au>
                  <snm>Kohel</snm>
                  <fnm>RJ</fnm>
               </au>
            </aug>
            <source>Advances in Genetics</source>
            <pubdate>1985</pubdate>
            <volume>23</volume>
            <fpage>271</fpage>
            <lpage>375</lpage>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Cotton</p>
            </title>
            <aug>
               <au>
                  <snm>Wendel</snm>
                  <fnm>JF</fnm>
               </au>
            </aug>
            <source>Evolution of crop plants</source>
            <publisher>London: Longman</publisher>
            <editor>Smartt J</editor>
            <pubdate>2000</pubdate>
            <fpage>358</fpage>
            <lpage>366</lpage>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Microarray expression profiling resources for plant genomics</p>
            </title>
            <aug>
               <au>
                  <snm>Rensink</snm>
                  <fnm>WA</fnm>
               </au>
               <au>
                  <snm>Buell</snm>
                  <fnm>CR</fnm>
               </au>
            </aug>
            <source>Trends in Plant Science</source>
            <pubdate>2005</pubdate>
            <volume>10</volume>
            <fpage>603</fpage>
            <lpage>609</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.tplants.2005.10.003</pubid>
                  <pubid idtype="pmpid" link="fulltext">16275051</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>ESTs, cDNA microarrays, and gene expression profiling: tools for dissecting plant physiology and development</p>
            </title>
            <aug>
               <au>
                  <snm>Alba</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Fei</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Payton</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Moore</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Debbie</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Cohn</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>D'Ascenzo</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Gordon</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Rose</snm>
                  <fnm>JKC</fnm>
               </au>
               <au>
                  <snm>Martin</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Tanksley</snm>
                  <fnm>SD</fnm>
               </au>
               <au>
                  <snm>Bouzayen</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Jahn</snm>
                  <fnm>MM</fnm>
               </au>
               <au>
                  <snm>Giovannoni</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>The Plant Journal</source>
            <pubdate>2004</pubdate>
            <volume>39</volume>
            <fpage>697</fpage>
            <lpage>714</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1365-313X.2004.02178.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">15315633</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Methods for transcriptional profiling in plants. Be fruitful and replicate</p>
            </title>
            <aug>
               <au>
                  <snm>Meyers</snm>
                  <fnm>BC</fnm>
               </au>
               <au>
                  <snm>Galbraith</snm>
                  <fnm>DW</fnm>
               </au>
               <au>
                  <snm>Nelson</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Agrawal</snm>
                  <fnm>V</fnm>
               </au>
            </aug>
            <source>Plant Physiology</source>
            <pubdate>2004</pubdate>
            <volume>135</volume>
            <fpage>637</fpage>
            <lpage>652</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">514100</pubid>
                  <pubid idtype="pmpid" link="fulltext">15173570</pubid>
                  <pubid idtype="doi">10.1104/pp.104.040840</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>Functional genomics of cell elongation in developing cotton fibers</p>
            </title>
            <aug>
               <au>
                  <snm>Arpat</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Waugh</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Sullivan</snm>
                  <fnm>JP</fnm>
               </au>
               <au>
                  <snm>Gonzales</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Frisch</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Main</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Wood</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Leslie</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Wing</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Wilkins</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Plant Molecular Biology</source>
            <pubdate>2004</pubdate>
            <volume>54</volume>
            <fpage>911</fpage>
            <lpage>929</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/s11103-004-0392-y</pubid>
                  <pubid idtype="pmpid" link="fulltext">15604659</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>A global assembly of cotton ESTs</p>
            </title>
            <aug>
               <au>
                  <snm>Udall</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Swanson</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Haller</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Rapp</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Sparks</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Hatfield</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Yu</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Wu</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Dowd</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Arpat</snm>
                  <fnm>AB</fnm>
               </au>
               <au>
                  <snm>Sickler</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Wilkins</snm>
                  <fnm>TA</fnm>
               </au>
               <au>
                  <snm>Guo</snm>
                  <fnm>JY</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>XY</fnm>
               </au>
               <au>
                  <snm>Scheffler</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Taliercio</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Turley</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>McFadden</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Payton</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Klueva</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Allen</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Haigler</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Wilkerson</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Suo</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Schulze</snm>
                  <fnm>SR</fnm>
               </au>
               <au>
                  <snm>Pierce</snm>
                  <fnm>ML</fnm>
               </au>
               <au>
                  <snm>Essenberg</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Llewellyn</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Dennis</snm>
                  <fnm>ES</fnm>
               </au>
               <au>
                  <snm>Kudrna</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Wing</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Paterson</snm>
                  <fnm>AH</fnm>
               </au>
               <au>
                  <snm>Soderlund</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Wendel</snm>
                  <fnm>JF</fnm>
               </au>
            </aug>
            <source>Genome Research</source>
            <pubdate>2006</pubdate>
            <volume>16</volume>
            <fpage>441</fpage>
            <lpage>450</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1415220</pubid>
                  <pubid idtype="pmpid" link="fulltext">16478941</pubid>
                  <pubid idtype="doi">10.1101/gr.4602906</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>The TIGR gene index project</p>
            </title>
            <url>http://compbio.dfci.harvard.edu/tgi</url>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Arabidopsis Oligonucleotide Microarrays</p>
            </title>
            <url>http://www.ag.arizona.edu/microarray</url>
         </bibl>
         <bibl id="B13">
            <title>
               <p>NSF Rice Oligonucleotide Array Project</p>
            </title>
            <url>http://www.ricearray.org</url>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Maize Oligonucleotide Array Project</p>
            </title>
            <url>http://www.maizearray.org</url>
         </bibl>
         <bibl id="B15">
            <title>
               <p>Gene Expression Profiling at the Boyce Thompson Institute</p>
            </title>
            <url>http://bti.cornell.edu/CGEP/CGEP.html</url>
         </bibl>
         <bibl id="B16">
            <title>
               <p>The evolutionary genomics of cotton</p>
            </title>
            <url>http://cottonevolution.info</url>
         </bibl>
         <bibl id="B17">
            <title>
               <p>Developmental and gene expression analyses of a cotton naked seed mutant</p>
            </title>
            <aug>
               <au>
                  <snm>Lee</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Hassan</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Gao</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Wei</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Kohel</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>X-Y</fnm>
               </au>
               <au>
                  <snm>Payton</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Sze</snm>
                  <fnm>S-H</fnm>
               </au>
               <au>
                  <snm>Stelly</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>Z</fnm>
               </au>
            </aug>
            <source>Planta</source>
            <pubdate>2006</pubdate>
            <volume>223</volume>
            <fpage>418</fpage>
            <lpage>432</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/s00425-005-0098-7</pubid>
                  <pubid idtype="pmpid" link="fulltext">16254724</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>Picky: oligo microarray design for large genomes</p>
            </title>
            <aug>
               <au>
                  <snm>Chou</snm>
                  <fnm>H-H</fnm>
               </au>
               <au>
                  <snm>Hsia</snm>
                  <fnm>A-P</fnm>
               </au>
               <au>
                  <snm>Mooney</snm>
                  <fnm>DL</fnm>
               </au>
               <au>
                  <snm>Schnable</snm>
                  <fnm>PS</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2004</pubdate>
            <volume>20</volume>
            <fpage>2893</fpage>
            <lpage>2902</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/bth347</pubid>
                  <pubid idtype="pmpid" link="fulltext">15180932</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Differential lineage-specific amplification of transposable elements is responsible for genome size variation in <it>Gossypium</it></p>
            </title>
            <aug>
               <au>
                  <snm>Hawkins</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Nason</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Wing</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Wendel</snm>
                  <fnm>JF</fnm>
               </au>
            </aug>
            <source>Genome Research</source>
            <pubdate>2006</pubdate>
            <volume>16</volume>
            <fpage>1252</fpage>
            <lpage>1261</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1101/gr.5282906</pubid>
                  <pubid idtype="pmpid" link="fulltext">16954538</pubid>
                  <pubid idtype="pmcid">1581434</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>Differential methylation of genes and repeats in land plants</p>
            </title>
            <aug>
               <au>
                  <snm>Rabinowicz</snm>
                  <fnm>PD</fnm>
               </au>
               <au>
                  <snm>Citek</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Budiman</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Nunberg</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Bedell</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Lakey</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>O'Shaughnessy</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Nascimento</snm>
                  <fnm>LU</fnm>
               </au>
               <au>
                  <snm>McCombie</snm>
                  <fnm>WR</fnm>
               </au>
               <au>
                  <snm>Martienssen</snm>
                  <fnm>RA</fnm>
               </au>
            </aug>
            <source>Genome Research</source>
            <pubdate>2005</pubdate>
            <volume>15</volume>
            <fpage>1431</fpage>
            <lpage>1440</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1240086</pubid>
                  <pubid idtype="pmpid" link="fulltext">16204196</pubid>
                  <pubid idtype="doi">10.1101/gr.4100405</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>The Vmatch large scale sequence analysis software</p>
            </title>
            <url>http://www.vmatch.de</url>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Cycloheximide treatment of cotton ovules alters the abundance of specific classes of mRNAs and generates novel ESTs for microarray expression profiling</p>
            </title>
            <aug>
               <au>
                  <snm>Wu</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Rozenfeld</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Defferrard</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Ruggiero</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Udall</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Llewellyn</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Dennis</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>Molecular Genetics and Genomics</source>
            <pubdate>2005</pubdate>
            <volume>274</volume>
            <fpage>477</fpage>
            <lpage>493</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1007/s00438-005-0049-9</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B23">
            <title>
               <p>Microarray data analysis: from disarray to consolidation and consensus</p>
            </title>
            <aug>
               <au>
                  <snm>Allison</snm>
                  <fnm>DB</fnm>
               </au>
               <au>
                  <snm>Cui</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Page</snm>
                  <fnm>GP</fnm>
               </au>
               <au>
                  <snm>Sabripour</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Nature Reviews Genetics</source>
            <pubdate>2006</pubdate>
            <volume>7</volume>
            <fpage>55</fpage>
            <lpage>65</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nrg1749</pubid>
                  <pubid idtype="pmpid" link="fulltext">16369572</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Design considerations for efficient and effective microarray studies</p>
            </title>
            <aug>
               <au>
                  <snm>Kerr</snm>
                  <fnm>MK</fnm>
               </au>
            </aug>
            <source>Biometrics</source>
            <pubdate>2003</pubdate>
            <volume>59</volume>
            <fpage>822</fpage>
            <lpage>828</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.0006-341X.2003.00096.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">14969460</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>Fundamentals of experimental design for cDNA microarrays</p>
            </title>
            <aug>
               <au>
                  <snm>Churchill</snm>
                  <fnm>GA</fnm>
               </au>
            </aug>
            <source>Nature Genetics</source>
            <pubdate>2002</pubdate>
            <volume>32</volume>
            <fpage>S490</fpage>
            <lpage>S495</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1038/ng1031</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>Design issues for cDNA microarray experiments</p>
            </title>
            <aug>
               <au>
                  <snm>Yang</snm>
                  <fnm>YH</fnm>
               </au>
               <au>
                  <snm>Speed</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Nature Reviews Genetics</source>
            <pubdate>2002</pubdate>
            <volume>3</volume>
            <fpage>579</fpage>
            <lpage>588</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12154381</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>Methods for genome-wide analysis of gene expression changes in polyploids</p>
            </title>
            <aug>
               <au>
                  <snm>Wang</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>JJ</fnm>
               </au>
               <au>
                  <snm>Tian</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>HS</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Rao</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Wei</snm>
                  <fnm>EN</fnm>
               </au>
               <au>
                  <snm>Doerge</snm>
                  <fnm>RW</fnm>
               </au>
               <au>
                  <snm>Comai</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>ZJ</fnm>
               </au>
            </aug>
            <source>Methods in Enzymology</source>
            <pubdate>2005</pubdate>
            <volume>395</volume>
            <fpage>570</fpage>
            <lpage>596</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0076-6879(05)95030-1</pubid>
                  <pubid idtype="pmpid" link="fulltext">15865985</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Modeling sequencing errors by combining Hidden Markov models</p>
            </title>
            <aug>
               <au>
                  <snm>Lottaz</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Iseli</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Jongeneel</snm>
                  <fnm>CV</fnm>
               </au>
               <au>
                  <snm>Bucher</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2003</pubdate>
            <volume>19</volume>
            <fpage>ii103</fpage>
            <lpage>ii112</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/btg1067</pubid>
                  <pubid idtype="pmpid" link="fulltext">14534179</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>Gene Ontology: tool for the unification of biology</p>
            </title>
            <aug>
               <au>
                  <snm>Ashburner</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Ball</snm>
                  <fnm>CA</fnm>
               </au>
               <au>
                  <snm>Blake</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Botstein</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Butler</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Cherry</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Davis</snm>
                  <fnm>AP</fnm>
               </au>
               <au>
                  <snm>Dolinski</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Dwight</snm>
                  <fnm>SS</fnm>
               </au>
               <au>
                  <snm>Eppig</snm>
                  <fnm>JT</fnm>
               </au>
               <au>
                  <snm>Harris</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Hill</snm>
                  <fnm>DP</fnm>
               </au>
               <au>
                  <snm>Issel-Tarver</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Kasarskis</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Lewis</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Matese</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Richardson</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Ringwald</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Rubin</snm>
                  <fnm>GM</fnm>
               </au>
               <au>
                  <snm>Sherlock</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>Nature Genetics</source>
            <pubdate>2000</pubdate>
            <volume>25</volume>
            <fpage>25</fpage>
            <lpage>29</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/75556</pubid>
                  <pubid idtype="pmpid" link="fulltext">10802651</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>The Pfam protein families database</p>
            </title>
            <aug>
               <au>
                  <snm>Bateman</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Coin</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Durbin</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Finn</snm>
                  <fnm>RD</fnm>
               </au>
               <au>
                  <snm>Hollich</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Griffiths-Jones</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Khanna</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Marshall</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Moxon</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Sonnhammer</snm>
                  <fnm>ELL</fnm>
               </au>
               <au>
                  <snm>Studholme</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Yeats</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Eddy</snm>
                  <fnm>SR</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Research</source>
            <pubdate>2004</pubdate>
            <volume>32</volume>
            <fpage>D138</fpage>
            <lpage>D141</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">308855</pubid>
                  <pubid idtype="pmpid" link="fulltext">14681378</pubid>
                  <pubid idtype="doi">10.1093/nar/gkh121</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>DeRisi Laboratory at University of California San Francisco</p>
            </title>
            <url>http://derisilab.ucsf.edu</url>
         </bibl>
         <bibl id="B32">
            <title>
               <p>NCBI GEO: mining millions of expression profiles &#8211; database and tools</p>
            </title>
            <aug>
               <au>
                  <snm>Barrett</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Suzek</snm>
                  <fnm>TO</fnm>
               </au>
               <au>
                  <snm>Troup</snm>
                  <fnm>DB</fnm>
               </au>
               <au>
                  <snm>Wilhite</snm>
                  <fnm>SE</fnm>
               </au>
               <au>
                  <snm>Ngau</snm>
                  <fnm>W-C</fnm>
               </au>
               <au>
                  <snm>Ledoux</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Rudnev</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Lash</snm>
                  <fnm>AE</fnm>
               </au>
               <au>
                  <snm>Fujibuchi</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Edgar</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Research</source>
            <pubdate>2005</pubdate>
            <volume>33</volume>
            <fpage>D562</fpage>
            <lpage>D566</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">539976</pubid>
                  <pubid idtype="pmpid" link="fulltext">15608262</pubid>
                  <pubid idtype="doi">10.1093/nar/gki022</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>Isolation of RNA from plant tissue</p>
            </title>
            <aug>
               <au>
                  <snm>Wilkins</snm>
                  <fnm>TA</fnm>
               </au>
               <au>
                  <snm>Smart</snm>
                  <fnm>LB</fnm>
               </au>
            </aug>
            <source>A laboratory guide to RNA: isolation, analysis, and synthesis</source>
            <publisher>New York: Wiley-Liss</publisher>
            <editor>Krieg PA</editor>
            <pubdate>1996</pubdate>
            <fpage>21</fpage>
            <lpage>41</lpage>
         </bibl>
         <bibl id="B34">
            <title>
               <p>Statistical significance for genomewide studies</p>
            </title>
            <aug>
               <au>
                  <snm>Storey</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Tibshirani</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Proceedings of the National Academy of Sciences of the United States of America</source>
            <pubdate>2003</pubdate>
            <volume>100</volume>
            <fpage>9440</fpage>
            <lpage>9445</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">170937</pubid>
                  <pubid idtype="pmpid" link="fulltext">12883005</pubid>
                  <pubid idtype="doi">10.1073/pnas.1530509100</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
      </refgrp>
   </bm>
</art>
