<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>1471-2202-9-66</ui>
   <ji>1471-2202</ji>
   <fm>
      <dochead>Research article</dochead>
      <bibl>
         <title>
            <p>Identification of a set of genes showing regionally enriched expression in the mouse brain</p>
         </title>
         <aug>
            <au id="A1" ca="yes" ce="yes">
               <snm>D'Souza</snm>
               <mi>A</mi>
               <fnm>Cletus</fnm>
               <insr iid="I1"/>
               <email>cdsouza@bcgsc.ca</email>
            </au>
            <au id="A2" ce="yes">
               <snm>Chopra</snm>
               <fnm>Vikramjit</fnm>
               <insr iid="I1"/>
               <email>vchopra@bcgsc.ca</email>
            </au>
            <au id="A3">
               <snm>Varhol</snm>
               <fnm>Richard</fnm>
               <insr iid="I1"/>
               <email>rvarhol@bcgsc.ca</email>
            </au>
            <au id="A4">
               <snm>Xie</snm>
               <fnm>Yuan-Yun</fnm>
               <insr iid="I2"/>
               <email>yyxie@cmmt.ubc.ca</email>
            </au>
            <au id="A5">
               <snm>Bohacec</snm>
               <fnm>Slavita</fnm>
               <insr iid="I2"/>
               <email>slavita@cmmt.ubc.ca</email>
            </au>
            <au id="A6">
               <snm>Zhao</snm>
               <fnm>Yongjun</fnm>
               <insr iid="I1"/>
               <email>yzhao@bcgsc.ca</email>
            </au>
            <au id="A7">
               <snm>Lee</snm>
               <mi>LC</mi>
               <fnm>Lisa</fnm>
               <insr iid="I2"/>
               <email>Lisa.Lee@postgrad.manchester.ac.uk</email>
            </au>
            <au id="A8">
               <snm>Bilenky</snm>
               <fnm>Mikhail</fnm>
               <insr iid="I1"/>
               <email>mbilenky@bcgsc.ca</email>
            </au>
            <au id="A9">
               <snm>Portales-Casamar</snm>
               <fnm>Elodie</fnm>
               <insr iid="I2"/>
               <email>elodie@cmmt.ubc.ca</email>
            </au>
            <au id="A10">
               <snm>He</snm>
               <fnm>An</fnm>
               <insr iid="I1"/>
               <email>ahe@bcgsc.ca</email>
            </au>
            <au id="A11">
               <snm>Wasserman</snm>
               <mi>W</mi>
               <fnm>Wyeth</fnm>
               <insr iid="I2"/>
               <email>wyeth@cmmt.ubc.ca</email>
            </au>
            <au id="A12">
               <snm>Goldowitz</snm>
               <fnm>Daniel</fnm>
               <insr iid="I2"/>
               <email>dang@cmmt.ubc.ca</email>
            </au>
            <au id="A13">
               <snm>Marra</snm>
               <mi>A</mi>
               <fnm>Marco</fnm>
               <insr iid="I1"/>
               <email>mmarra@bcgsc.ca</email>
            </au>
            <au id="A14">
               <snm>Holt</snm>
               <mi>A</mi>
               <fnm>Robert</fnm>
               <insr iid="I2"/>
               <email>rholt@bcgsc.ca</email>
            </au>
            <au id="A15">
               <snm>Simpson</snm>
               <mi>M</mi>
               <fnm>Elizabeth</fnm>
               <insr iid="I2"/>
               <email>simpson@cmmt.ubc.ca</email>
            </au>
            <au id="A16">
               <snm>Jones</snm>
               <mi>JM</mi>
               <fnm>Steven</fnm>
               <insr iid="I1"/>
               <email>sjones@bcgsc.ca</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Genome Sciences Centre, British Columbia Cancer Agency, 570 West 7th Ave &#8211; Suite 100, Vancouver, BC, V5Z 4E6, Canada</p>
            </ins>
            <ins id="I2">
               <p>Centre for Molecular Medicine and Therapeutics, Child and Family Research Institute, Department of Medical Genetics, University of British Columbia, 950 West 28th Ave., Vancouver, BC, V5Z 4H4, Canada</p>
            </ins>
         </insg>
         <source>BMC Neuroscience</source>
         <issn>1471-2202</issn>
         <pubdate>2008</pubdate>
         <volume>9</volume>
         <issue>1</issue>
         <fpage>66</fpage>
         <url>http://www.biomedcentral.com/1471-2202/9/66</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">18625066</pubid>
               <pubid idtype="doi">10.1186/1471-2202-9-66</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>24</day>
               <month>12</month>
               <year>2007</year>
            </date>
         </rec>
         <acc>
            <date>
               <day>14</day>
               <month>7</month>
               <year>2008</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>14</day>
               <month>7</month>
               <year>2008</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2008</year>
         <collab>D'Souza et al; licensee BioMed Central Ltd.</collab>
         <note>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>The Pleiades Promoter Project aims to improve gene therapy by designing human mini-promoters (&lt; 4 kb) that drive gene expression in specific brain regions or cell-types of therapeutic interest. Our goal was to first identify genes displaying regionally enriched expression in the mouse brain so that promoters designed from orthologous human genes can then be tested to drive reporter expression in a similar pattern in the mouse brain.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>We have utilized LongSAGE to identify regionally enriched transcripts in the adult mouse brain. As supplemental strategies, we also performed a meta-analysis of published literature and inspected the Allen Brain Atlas <it>in situ </it>hybridization data. From a set of approximately 30,000 mouse genes, 237 were identified as showing specific or enriched expression in 30 target regions of the mouse brain. GO term over-representation among these genes revealed co-involvement in various aspects of central nervous system development and physiology.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>Using a multi-faceted expression validation approach, we have identified mouse genes whose human orthologs are good candidates for design of mini-promoters. These mouse genes represent molecular markers in several discrete brain regions/cell-types, which could potentially provide a mechanistic explanation of unique functions performed by each region. This set of markers may also serve as a resource for further studies of gene regulatory elements influencing brain expression.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>The Pleiades Promoter Project (please see Availability &amp; requirements for more information) addresses two major challenges identified in gene therapy &#8211; first, the delivery of DNA to specific cell types to reduce side effects from treating healthy cells and second, controlled delivery of DNA to a specific locus in the genome to avoid insertional mutagenesis. The goal for the project is the generation of human DNA promoters less than 4 kb in length (mini-promoters) that drive gene expression in brain regions important in neurological conditions. To achieve this goal, we have first identified genes with enriched expression in different regions of the adult mouse brain. Regional expression patterns within the brain tend to be conserved between orthologous human and mouse genes <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. Additionally, as regulatory sequences in tissue-specific genes tend to be highly conserved <abbrgrp><abbr bid="B2">2</abbr></abbrgrp>, human mini-promoters are expected to drive regional gene expression in transgenic mice based on earlier studies <abbrgrp><abbr bid="B3">3</abbr></abbrgrp>. Therefore, promoter regions from orthologous human genes will be assessed in the mouse brain for the ability to drive regional expression.</p>
         <p>Selection of the optimal genes for promoter design necessitates detailed assessment of gene expression patterns. An invaluable resource to identify genes expressed in the mammalian brain is the serial analysis of gene expression (SAGE) technique <abbrgrp><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr></abbrgrp>. A modern improvement of tag-based expression analysis is LongSAGE, which produces longer transcript tags (21-bp) better suited to unique mapping onto cDNA and genome sequences <abbrgrp><abbr bid="B6">6</abbr></abbrgrp>. As part of the Mouse Atlas of Gene Expression project <abbrgrp><abbr bid="B7">7</abbr></abbrgrp>, LongSAGE was used to profile transcriptomes of 72 tissues of mouse strain C57BL/6J at various stages of development <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>. For the Pleiades Promoter Project <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>, a scion of the Mouse Atlas project, we have generated new LongSAGE data on gene expression in the adult mouse central nervous system to identify genes that display enriched expression in key brain regions.</p>
         <p>While LongSAGE provides a rich perspective on gene expression patterns, we extended our data mining efforts to include other large information sources. The PubMed database <abbrgrp><abbr bid="B10">10</abbr></abbrgrp> provides an unparalleled compendium of text from the scientific literature. In order to facilitate extraction of key information from Medline abstracts or full-text articles in PubMed, natural language processing tools are routinely employed to semi-automate the process of literature mining <abbrgrp><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr></abbrgrp>. In this study we investigated an approach to specifically and automatically identify associations between genes and brain regions from the literature. We further analysed expression data from the Allen Brain Atlas (ABA; <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>), a high-throughput <it>in situ </it>hybridization platform that has assayed expression for ~20,000 genes in the adult mouse brain <abbrgrp><abbr bid="B14">14</abbr><abbr bid="B15">15</abbr></abbrgrp>. Here, we report the successful utilization of a combination of gene-finding tools, including SAGE analysis, text mining and ABA expression data, to identify genes displaying regionally enriched expression in surrogate regions of therapeutic interest within the mouse brain.</p>
      </sec>
      <sec>
         <st>
            <p>Results</p>
         </st>
         <sec>
            <st>
               <p>Identification of brain region-enriched gene expression by LongSAGE</p>
            </st>
            <p>To identify regionally enriched gene expression within the brain of the adult mouse strain C57BL/6J, we used the precision of Laser Capture Microdissection (LCM; Figure <figr fid="F1">1</figr>) <abbrgrp><abbr bid="B16">16</abbr></abbrgrp> to isolate component tissues and construct SAGE libraries from 17 brain regions as well as the whole adult mouse brain for comparison (Methods). As shown in Table <tblr tid="T1">1</tblr>, these libraries have been sampled to a depth of > 100,000 tags each, a level shown to be adequate for the discovery of medium-to-high level transcripts <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>. Bioinformatics analysis of differential gene expression was performed as described in Methods. Since the majority of transcripts were detected in multiple libraries, we employed a heuristic approach to identify and rank expression patterns (outlined in Table <tblr tid="T2">2</tblr>). For each brain region, we ranked genes from 1&#8211;91 based on the level and pattern of expression in descending order. Expression specificity of a ranked list of 1999 SAGE-identified genes was then confirmed by examining related literature information and Allen Brain Atlas <it>in situ </it>hybridization data. Based on this collective information, region-specific or region-enriched genes were further considered.</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>List of adult brain region SAGE libraries</p>
               </caption>
               <tblbdy cols="4">
                  <r>
                     <c ca="center">
                        <p>
                           <b>Name</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Description</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>No. of Genes</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Total Tags<sup>b</sup></b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM098</p>
                     </c>
                     <c ca="center">
                        <p>Whole brain<sup>a</sup></p>
                     </c>
                     <c ca="center">
                        <p>6893</p>
                     </c>
                     <c ca="center">
                        <p>108441</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM110</p>
                     </c>
                     <c ca="center">
                        <p>Hypothalamus</p>
                     </c>
                     <c ca="center">
                        <p>6676</p>
                     </c>
                     <c ca="center">
                        <p>108882</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM132</p>
                     </c>
                     <c ca="center">
                        <p>Ventral Thalamus</p>
                     </c>
                     <c ca="center">
                        <p>6441</p>
                     </c>
                     <c ca="center">
                        <p>105701</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM137</p>
                     </c>
                     <c ca="center">
                        <p>Hippocampus Dentate Gyrus, dorsal/anterior</p>
                     </c>
                     <c ca="center">
                        <p>5935</p>
                     </c>
                     <c ca="center">
                        <p>104322</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM139</p>
                     </c>
                     <c ca="center">
                        <p>Medial Thalamus</p>
                     </c>
                     <c ca="center">
                        <p>6608</p>
                     </c>
                     <c ca="center">
                        <p>105364</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM147</p>
                     </c>
                     <c ca="center">
                        <p>Visual Cortex Layers II/III/IV</p>
                     </c>
                     <c ca="center">
                        <p>6683</p>
                     </c>
                     <c ca="center">
                        <p>136039</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM152</p>
                     </c>
                     <c ca="center">
                        <p>Substantia Nigra</p>
                     </c>
                     <c ca="center">
                        <p>6584</p>
                     </c>
                     <c ca="center">
                        <p>115991</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM153</p>
                     </c>
                     <c ca="center">
                        <p>Basal Nucleus of Meynert</p>
                     </c>
                     <c ca="center">
                        <p>6581</p>
                     </c>
                     <c ca="center">
                        <p>120997</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM180</p>
                     </c>
                     <c ca="center">
                        <p>Locus Coeruleus</p>
                     </c>
                     <c ca="center">
                        <p>6282</p>
                     </c>
                     <c ca="center">
                        <p>102933</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM181</p>
                     </c>
                     <c ca="center">
                        <p>Raphe Nuclei</p>
                     </c>
                     <c ca="center">
                        <p>6434</p>
                     </c>
                     <c ca="center">
                        <p>104627</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM182</p>
                     </c>
                     <c ca="center">
                        <p>Cerebellum White Matter</p>
                     </c>
                     <c ca="center">
                        <p>5461</p>
                     </c>
                     <c ca="center">
                        <p>107335</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM183</p>
                     </c>
                     <c ca="center">
                        <p>Primary Motor Cortex</p>
                     </c>
                     <c ca="center">
                        <p>6543</p>
                     </c>
                     <c ca="center">
                        <p>115262</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM184</p>
                     </c>
                     <c ca="center">
                        <p>Hippocampus CA1, dorsal/anterior</p>
                     </c>
                     <c ca="center">
                        <p>6331</p>
                     </c>
                     <c ca="center">
                        <p>118198</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM193</p>
                     </c>
                     <c ca="center">
                        <p>Amygdala, basolateral complex</p>
                     </c>
                     <c ca="center">
                        <p>6396</p>
                     </c>
                     <c ca="center">
                        <p>109772</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM194</p>
                     </c>
                     <c ca="center">
                        <p>Amygdala, central nucleus</p>
                     </c>
                     <c ca="center">
                        <p>6451</p>
                     </c>
                     <c ca="center">
                        <p>110056</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM195</p>
                     </c>
                     <c ca="center">
                        <p>Dorsal striatum</p>
                     </c>
                     <c ca="center">
                        <p>6185</p>
                     </c>
                     <c ca="center">
                        <p>105509</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM196</p>
                     </c>
                     <c ca="center">
                        <p>Cerebellum, Purkinje Cell Layer</p>
                     </c>
                     <c ca="center">
                        <p>6604</p>
                     </c>
                     <c ca="center">
                        <p>104850</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>SM201</p>
                     </c>
                     <c ca="center">
                        <p>Ependymal and Subependymal Layers</p>
                     </c>
                     <c ca="center">
                        <p>6561</p>
                     </c>
                     <c ca="center">
                        <p>107041</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p><sup>a</sup>Manually dissected; all others were laser capture microdissected</p>
                  <p><sup>b</sup>Represents filtered data</p>
               </tblfn>
            </tbl>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Rank order based on the level and pattern of gene expression</p>
               </caption>
               <tblbdy cols="2">
                  <r>
                     <c ca="center">
                        <p>
                           <b>Rank Order</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Expression Pattern</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="2">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1 TL* and 0 OTL* (<it>P</it><sub><it>TL</it>-<it>OTL </it></sub>&#8804; 0.05) (TL tag count &#8805; 5)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>2&#8211;6</p>
                     </c>
                     <c ca="center">
                        <p>1 TL and 1&#8211;5 OTLs (<it>P</it><sub><it>TL</it>-<it>OTL </it></sub>&#8804; 0.05)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>7&#8211;11</p>
                     </c>
                     <c ca="center">
                        <p>1 TL and 1&#8211;5 OTLs (<it>P</it><sub><it>TL</it>-<it>OTL </it></sub>> 0.05) (TL tag count &#8805; 5, OTL tag count: 1&#8211;4)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>12&#8211;17</p>
                     </c>
                     <c ca="center">
                        <p>2 TLs and 0&#8211;5 OTLs (<it>P</it><sub><it>TL</it>-<it>TL </it></sub>> 0.05; <it>P</it><sub><it>TL</it>-<it>OTL </it></sub>&#8804; 0.05)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>18&#8211;22</p>
                     </c>
                     <c ca="center">
                        <p>2 TLs and 1&#8211;5 OTLs (<it>P</it><sub><it>TL</it>-<it>TL </it></sub>> 0.05; <it>P</it><sub><it>TL</it>-<it>OTL </it></sub>> 0.05) (TL tag count &#8805; 5, OTL tag count: 1&#8211;4)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>23&#8211;28</p>
                     </c>
                     <c ca="center">
                        <p>3 TLs and 0&#8211;5 OTLs (<it>P</it><sub><it>TL</it>-<it>TL </it></sub>> 0.05; <it>P</it><sub><it>TL</it>-<it>OTL </it></sub>&#8804; 0.05)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>29&#8211;33</p>
                     </c>
                     <c ca="center">
                        <p>3 TLs and 1&#8211;5 OTLs (<it>P</it><sub><it>TL</it>-<it>TL </it></sub>> 0.05; <it>P</it><sub><it>TL</it>-<it>OTL </it></sub>> 0.05) (TL tag count &#8805; 5, OTL tag count: 1&#8211;4)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>34&#8211;39</p>
                     </c>
                     <c ca="center">
                        <p>4 TLs and 0&#8211;5 OTLs (<it>P</it><sub><it>TL</it>-<it>TL </it></sub>> 0.05; <it>P</it><sub><it>TL</it>-<it>OTL </it></sub>&#8804; 0.05)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>40&#8211;44</p>
                     </c>
                     <c ca="center">
                        <p>4 TLs and 1&#8211;5 OTLs (<it>P</it><sub><it>TL</it>-<it>TL </it></sub>> 0.05; <it>P</it><sub><it>TL</it>-<it>OTL </it></sub>> 0.05) (TL tag count &#8805; 5, OTL tag count: 1&#8211;4)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>45&#8211;55</p>
                     </c>
                     <c ca="center">
                        <p>1 TL and 6&#8211;16 OTLs (<it>P</it><sub><it>TL</it>-<it>OTL </it></sub>&#8804; 0.05)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>56&#8211;65</p>
                     </c>
                     <c ca="center">
                        <p>2 TLs and 6&#8211;15 OTLs (<it>P</it><sub><it>TL</it>-<it>TL </it></sub>> 0.05; <it>P</it><sub><it>TL</it>-<it>OTL </it></sub>&#8804; 0.05)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>66&#8211;74</p>
                     </c>
                     <c ca="center">
                        <p>3 TLs and 6&#8211;14 OTLs (<it>P</it><sub><it>TL</it>-<it>TL </it></sub>> 0.05; <it>P</it><sub><it>TL</it>-<it>OTL </it></sub>&#8804; 0.05)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>75&#8211;82</p>
                     </c>
                     <c ca="center">
                        <p>4 TLs and 6&#8211;13 OTLs (<it>P</it><sub><it>TL</it>-<it>TL </it></sub>> 0.05; <it>P</it><sub><it>TL</it>-<it>OTL </it></sub>&#8804; 0.05)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>83</p>
                     </c>
                     <c ca="center">
                        <p>1 TL with 4 tags</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>84</p>
                     </c>
                     <c ca="center">
                        <p>1 TL with 3 tags</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>85</p>
                     </c>
                     <c ca="center">
                        <p>2 TLs with 4 tags</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>86</p>
                     </c>
                     <c ca="center">
                        <p>2 TLs with 3 tags</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>87</p>
                     </c>
                     <c ca="center">
                        <p>1 TL with 2 tags</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>88</p>
                     </c>
                     <c ca="center">
                        <p>2 TLs with 2 tags</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>89</p>
                     </c>
                     <c ca="center">
                        <p>3 TLs with 3 tags</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>90</p>
                     </c>
                     <c ca="center">
                        <p>3 TLs with 2 tags</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>91</p>
                     </c>
                     <c ca="center">
                        <p>1 TL with 1 tag</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>* TL = Target library (brain region of interest), OTL = Off-target library (background region)</p>
               </tblfn>
            </tbl>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Use of Laser Capture Microdissection to isolate the hippocampus dentate gyrus from an adult mouse</p>
               </caption>
               <text>
                  <p><b>Use of Laser Capture Microdissection to isolate the hippocampus dentate gyrus from an adult mouse</b>. A) Intact coronal brain section at ~Bregma -1.35 stained with cresyl violet. B &amp; C) dentate gyrus (DG) has been microdissected with laser. D) dentate gyrus has been isolated and captured for total RNA extraction and construction of SAGE libraries. Images were captured using a Sony DXC-390P 3-CCD color video camera attached to a Nikon Eclipse TE2000-S microscope (10&#215; magnification). Scale bar = 100 &#956;m. D: dorsal; V: ventral.</p>
               </text>
               <graphic file="1471-2202-9-66-1"/>
            </fig>
            <p>Of the 237 genes identified as displaying regionally enriched expression in this study, 132 genes [see Additional file <supplr sid="S1">1</supplr>] displayed expression patterns listed in Table <tblr tid="T2">2</tblr>. Only 22 genes were found in a single library and five of these (<it>A930006D11Rik</it>, <it>Chrna6</it>, <it>Gdf10</it>, <it>Hcrt</it>, and <it>Hes3</it>) were determined to be tissue-specific at a statistically significant level (tag counts > 5, <it>P </it>&lt; 0.05).</p>
            <suppl id="S1">
               <title>
                  <p>Additional file 1</p>
               </title>
               <text>
                  <p>Compilation of SAGE data for 237 regionally enriched genes.</p>
               </text>
               <file name="1471-2202-9-66-S1.xls">
                  <p>Click here for file</p>
               </file>
            </suppl>
         </sec>
         <sec>
            <st>
               <p>Complexity of the adult mouse brain transcriptome and SAGE-based analysis of transcriptome similarity of brain regions</p>
            </st>
            <p>As an indication of complexity of the adult mouse brain transcriptome, within the 18 Pleiades libraries (including whole adult brain library) expression was observed for 11,836 genes of the total 17,098 genes detectable within the Mouse Atlas (total number of tags mapped to the Mouse Atlas libraries was approximately 8.8 million including singletons). In contrast, the Allen Brain Atlas (ABA) contains expression patterns of approximately 16,000 genes across the entire adult C57BL/6J mouse brain (Susan Sunkin, ABA, personal communication); of these genes, roughly 65.5% (10,479/16,000) were detectable in the 18 Pleiades libraries. Furthermore, the Pleiades libraries provided about 8% (1,357/17,357) additional genes to the total number of genes detectable by ABA.</p>
            <p>We also analyzed SAGE data to measure transcriptome similarity between selected tissues. The premise was that tissues would cluster together or diverge based on the degree to which their genes are differentially expressed. Hierarchical clustering was done based on unweighted average distance between formed clusters (see description in Methods), the results of which are displayed in the form of a dendrogram (Figure <figr fid="F2">2</figr>). A pattern of divergent tissue clusters consistently emerges: a cluster of neuronal tissues and several discrete single tissue clusters including Ependymal Layers, Cerebellum White Matter and Cerebellum Purkinje Cell Layer. Among neuronal tissues, the Ventral and Medial Thalamus consistently clustered tightly together and had the lowest expression divergence of any pair of tissues. Additionally, Visual Cortex, Primary Motor Cortex, Amygdala (basolateral), Amygdala (central), and Dorsal Striatum also clustered together. Segregation of the Ependymal tissue into a separate single cluster makes sense given its non-neuronal nature <abbrgrp><abbr bid="B17">17</abbr></abbrgrp>, and the Cerebellar White Matter is composed of myelinated axonal processes. Clustering is usually sensitive to the specific expression divergence measure used. However, we tried several empirical measures, as well as different <it>P </it>values for selecting differentially expressed genes, and observed that the main pattern of clustering outlined above remains unchanged.</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Transcriptome similarity among 17 brain tissues based on expression divergence at <it>P </it>value = 0.01</p>
               </caption>
               <text>
                  <p><b>Transcriptome similarity among 17 brain tissues based on expression divergence at <it>P </it>value = 0.01</b>. Tissues being compared are indicated on the Y-axis, and expression divergence (ED<sub><it>P</it></sub>) of clusters of tissues is plotted on the X-axis. At each node in the dendrogram, the number of genes shared between libraries in the tissue cluster is indicated. A threshold of 50% of maximum ED<sub><it>P </it></sub>was chosen for coloring of branch lines in the dendrogram.</p>
               </text>
               <graphic file="1471-2202-9-66-2"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Literature mining strategy to rapidly identify genes associated with brain regions of interest</p>
            </st>
            <p>We included in the present analysis several additional brain regions and cell-types, for example, Blood-Brain Barrier, Barrington's Nucleus, Astroglia etc., for which SAGE libraries had not been constructed. Therefore, to expand our set of genes with regionally enriched expression for all brain regions, we then scrutinized literature from PubMed. We obtained a list of Medline records using Boolean logic with search term combinations indicated in Table <tblr tid="T3">3</tblr>. To facilitate retrieval of publications from a large literature database such as PubMed, we also developed a semi-automated literature mining strategy (see Methods and Figure <figr fid="F3">3</figr>) based on natural language processing. In this approach we looked for the appearance of a gene name or synonym and a brain region in a sentence. Of the 99.7 million sentences searched, 314,515 occurrences of a brain region term were found; 4,395 mouse gene names, or the names of their human orthologs, were found to appear within the same sentence as a brain region (not shown).</p>
            <tbl id="T3">
               <title>
                  <p>Table 3</p>
               </title>
               <caption>
                  <p>Boolean search terms to obtain Medline records with information about region-associated expression or promoter characterization</p>
               </caption>
               <tblbdy cols="1">
                  <r>
                     <c ca="left">
                        <p>Gene AND brain AND in situ [qualifiers: Mouse/Human]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Gene AND brain region AND in situ</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Gene AND regulation</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Gene AND promoter</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Gene AND promoter AND brain</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Gene AND promoter AND brain region</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Gene AND promoter AND transgenic mice</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Gene AND promoter AND reporter (qualifiers: CAT/Luciferase/Gfp)</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Text mining data flow</p>
               </caption>
               <text>
                  <p><b>Text mining data flow</b>. This shows the steps by which the medical sentence parser retrieves Medline records that contain expression information for a gene in a specific region of the brain.</p>
               </text>
               <graphic file="1471-2202-9-66-3"/>
            </fig>
            <p>The candidature of literature-mined genes was verified by assessing available expression data (reporter gene expression, microarray expression profile, radioactive/non-radioactive <it>in situ </it>hybridization) in publications, and confirmed with <it>in situ </it>hybridization data from the Allen Brain Atlas (see below). In addition to promoter-reporter fusion data from the literature, reporter expression data for BAC (Bacterial Artificial Chromosome) transgenic mice, when available from the GENSAT database <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>, was also considered as complementary evidence of expression [see Additional file <supplr sid="S2">2</supplr>].</p>
            <suppl id="S2">
               <title>
                  <p>Additional file 2</p>
               </title>
               <text>
                  <p>Summary of expression profiles of region-specific or enriched genes by subanatomical region.</p>
               </text>
               <file name="1471-2202-9-66-S2.doc">
                  <p>Click here for file</p>
               </file>
            </suppl>
         </sec>
         <sec>
            <st>
               <p>Data mining genes showing regionally enriched expression from Allen Brain Atlas</p>
            </st>
            <p>The entire Allen Brain Atlas (ABA) data set can be searched via a web-based application <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr></abbrgrp>. We used this feature to examine expression patterns of genes identified as regionally enriched by SAGE and/or the literature. This verification was particularly apt for SAGE because ABA <it>in situ </it>hybridization patterns were also derived from the same mouse strain C57BL/6J. We also employed the ABA Anatomic Search tool to identify additional genes whose expression patterns cluster within brain regions of interest. While this approach short-listed genes for major regions (Thalamus, Cerebral Cortex etc.) of the mouse brain listed under Anatomic Search, we also searched within these regions to identify expression in sub-regions of interest, e.g. within Pons for genes expressed in Locus Coeruleus. Recent introduction of the alternative ABA search tool, NeuroBlast, also proved to be useful. We used NeuroBlast to retrieve genes co-expressed with a seeded (query) gene in a region of interest. Identification of regionally enriched co-expressed genes in this manner is indispensable in subsequent identification of shared regulatory elements for efficient mini-promoter design.</p>
            <p>Thus, SAGE analysis of the adult mouse brain transcriptome combined with meta-analysis using data mining resources described above identified 237 genes as showing regionally enriched expression (Table <tblr tid="T4">4</tblr>). A summary of the meta-analysis that supports regionally enriched expression is presented [see Additional file <supplr sid="S2">2</supplr>]; where available, this file includes examples of supporting ABA images downloaded from the ABA website (please see Availability &amp; requirements for more information).</p>
            <tbl id="T4">
               <title>
                  <p>Table 4</p>
               </title>
               <caption>
                  <p>List of regionally enriched genes in 30 brain regions and cell-types of therapeutic interest</p>
               </caption>
               <tblbdy cols="3">
                  <r>
                     <c ca="left">
                        <p>
                           <b>Brain Regions/Cell types</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>Example Processes/Disease Associations</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>Genes</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cortex</p>
                     </c>
                     <c ca="left">
                        <p>Alzheimer Disease, Amyotrophic Lateral Sclerosis, Plasticity</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>B3galt2, 3110035E14Rik, Ccl27, Ctgf, Emx1, Fhl2, Klf10, Myl4, Rbp4, Rtn4rl2, Stx1a, Tbr1, Vip, Ddit4l, Dkkl1, Rspo2, Ier5, Igfbp6, Ephb6, Mpped1, Pak7, Satb2, Cplx3, E430002G05Rik</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Hippocampus</p>
                     </c>
                     <c ca="left">
                        <p>Alzheimer Disease, Adult Neurogenesis, Depression, Plasticity</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Htr1A, Tgfb2, Gria1, Nr3c2</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Hippocampus, Ammon's Horn</p>
                     </c>
                     <c ca="left">
                        <p>Alzheimer Disease, Adult Neurogenesis, Depression, Plasticity</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Hunk, Klk8, Gpr161, Arfrp2, C630041L24Rik, Slc9a2, Neurod6, Pkp2, Fibcd1, Sstr4</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Hippocampus, Dentate Gyrus</p>
                     </c>
                     <c ca="left">
                        <p>Alzheimer Disease, Adult Neurogenesis, Depression, Plasticity</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Gabrd, Prox1, Dsp, C78409, Lct, Crlf1, Tdo2, A330019N05Rik, Lrrtm4, Htr4, Tspan18</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Neurogenic Regions</p>
                     </c>
                     <c ca="left">
                        <p>Adult Neurogenesis</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Nr2e1, Dcx, Mki67, Vim, Dlx2, Nes, Dlx1, Dscam, Fabp7, Igfbpl1, Lrrn1, Rrm1, Sox2, Thbs4</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Striatum</p>
                     </c>
                     <c ca="left">
                        <p>Huntington Disease, Parkinson Disease, Plasticity in Depression</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Adora2a, Gpr88, Drd1a, Drd2, Gpr6, Rgs9, Adcy5, Crym, Foxp1, Lpl, Pde1b1, Pdyn, Rarb, Rasd2, Tgfa</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Amygdala</p>
                     </c>
                     <c ca="left">
                        <p>Huntington Disease, Depression, Plasticity</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Tac1, Cyp26b1, Hap1, Cdh9, Ptprc, Gabra2, Hgf, Pdzrn3, Plxnd1, Wwox, Rasal1, Dock10, Prkcd</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Amygdala, Basolateral Complex</p>
                     </c>
                     <c ca="left">
                        <p>Huntington Disease, Depression, Plasticity</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Grp, Nov, Nr2f2</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Amygdala, Central Nucleus</p>
                     </c>
                     <c ca="left">
                        <p>Huntington Disease, Depression, Plasticity</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Atp6v1c2</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Thalamus</p>
                     </c>
                     <c ca="left">
                        <p>Huntington Disease</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Ramp3, Rgs16, Slitrk6, Tnnt1, 1110069I04Rik, Amotl1, Rab37, Sh3d19, Grid2ip, Lef1, Plekhg1, Syt9, Tcf7l2, Gm804, Gja7, Socs6, Vangl1</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Hypothalamus</p>
                     </c>
                     <c ca="left">
                        <p>Cancer</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Hcrt, Gpx3, Trh, Fezf1, Agrp, Calcr, Ghrh, Npy, Pmch, Pomc</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cerebellum, Granule Cells</p>
                     </c>
                     <c ca="left">
                        <p>Medulloblastoma, Ataxia, Cerebellar hypoplasia</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Gabra6, Cbln3</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cerebellum, Purkinje Cell Layer</p>
                     </c>
                     <c ca="left">
                        <p>Spinocerebellar Ataxia, Autism, Plasticity</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Pcp2, Hbegf, Icmt, Atp2a3, Casq2, Gdf10, Grid2, Hes3, Lhx1, Ptprm, A930006D11Rik</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Basal Nucleus of Meynert</p>
                     </c>
                     <c ca="left">
                        <p>Acetylcholine System, Alzheimer Disease</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Gal, Ngfr, Tac2, Lhx8, Ecel1, Gbx1, Lancl3, Ntrk1</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Substantia Nigra</p>
                     </c>
                     <c ca="left">
                        <p>Dopamine System, Parkinson Disease</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Ddc, Slc6a3, Ntsr1, Pitx3, Aldh1a1, Chrna6, Chrnb3, Th</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Raphe Nuclei</p>
                     </c>
                     <c ca="left">
                        <p>Serotonin System, Depression</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Fev, Gchfr, Slc6a4, Slc17a8, Tph2, Maob, Esr2</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Locus Coeruleus</p>
                     </c>
                     <c ca="left">
                        <p>Norepinephrine System, Depression</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Dbh, Maoa, Slc6a2, Slc18a2</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Astroglia</p>
                     </c>
                     <c ca="left">
                        <p>Alzheimer Disease</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Gfap, S100b, Slc1a2, Plaur, Gcm1, Gcm2, Serpina3n</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Microglia (activated)</p>
                     </c>
                     <c ca="left">
                        <p>Alzheimer Disease, Amyotrophic Lateral Sclerosis</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Cd68, Aif1, P2rx7, Sulf2</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Microglia (constitutive)</p>
                     </c>
                     <c ca="left">
                        <p>Alzheimer Disease</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Cx3cr1, Itgam</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Oligodendroglia</p>
                     </c>
                     <c ca="left">
                        <p>Alzheimer Disease, Multiple Sclerosis</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Olig1, Ugt8a, Cnp, Gjb1, Klk6, Mag, Apod, Enpp2, Fa2h, Mal, Mbp, Mobp, Mog, Olig2, Pllp, Plp1, Sox10, Tmem63a</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Barrington's Nucleus</p>
                     </c>
                     <c ca="left">
                        <p>Pain</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Crh, Fgfr1</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Brainstem, Pons and Medulla</p>
                     </c>
                     <c ca="left">
                        <p>Pain</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Slc6a5, Glra1, Pogz, Anxa4, Spp1, Esr1, Pou4f1, Slc4a2, Stac</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cortex, Anterior Cingulate</p>
                     </c>
                     <c ca="left">
                        <p>Pain</p>
                     </c>
                     <c ca="left">
                        <p><it>Egr1, Stmn1, Cckbr</it>, <it>Adcy1</it></p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cortex, Somatosensory</p>
                     </c>
                     <c ca="left">
                        <p>Pain</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Rspo1, Cyp39a1, Cartpt, Col5a1, Rorb, Loc433228, Gnb4</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cortex, Insula</p>
                     </c>
                     <c ca="left">
                        <p>Pain</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Lxn, Ntng2, Nr4a2, Fezf2, Ttc9b</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Hypothalamus, Paraventricular Nucleus</p>
                     </c>
                     <c ca="left">
                        <p>Pain</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Avp, Oxt</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Subthalamic Nucleus</p>
                     </c>
                     <c ca="left">
                        <p>Pain</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Pitx2, Lmx1b</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Blood Brain Barrier</p>
                     </c>
                     <c ca="left">
                        <p>Drug therapy</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>Abcb1a, Cldn5, Ednra, Fcgrt, Hspa12b, Lrp10, Lrp8, Rage, Slc2a1, Slc7a5, Slco1c1, Slc6a12, Slc28a2</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>GABAergic neurons</p>
                     </c>
                     <c ca="left">
                        <p>Schizophrenia, Bipolar Disorder</p>
                     </c>
                     <c ca="left">
                        <p><it>Vip</it>*, <it>Gpr88</it><sup>&#8225;</sup></p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>*also listed as a cortex-specific gene</p>
                  <p><sup>&#8225;</sup>also listed as a striatum-specific gene</p>
               </tblfn>
            </tbl>
         </sec>
         <sec>
            <st>
               <p>Identification of over-represented GO terms among genes with region-enriched expression</p>
            </st>
            <p>The Gene Ontology (GO) resource <abbrgrp><abbr bid="B19">19</abbr></abbrgrp> is a powerful tool to identify common functions shared by genes identified by high-throughput gene expression methods such as SAGE. We searched for over-representation of GO terms among our set of genes from each of three ontology classes: Biological Process, Molecular Function and Cellular Component (Methods). Of 237 genes in our selection, we found annotations for 216 genes in the whole mouse genome set of 18535 annotated genes (as of March 18, 2008). From this list, we determined the top 12 statistically over-represented GO terms [see Additional file <supplr sid="S3">3</supplr>]. Annotations for the test selection of genes were compared with GO annotations of the whole mouse genome. Significant biological processes involved nervous system development, transmission of nerve impulse, cell-cell signaling, neurogenesis, behavior etc. Significant molecular functions involved neuropeptide hormone activity, sequence-specific DNA binding, neurotransmitter receptor activity, steroid hormone receptor activity, neurotransmitter transporter activity etc. Products of some of these genes also tended to be localized in the extracellular region, plasma membrane, synapse, or within transcription factor complexes. Thus, it appears that many of the genes we identified have established neurological functions, which accounts for their regionally enriched expression. It is noteworthy that we found 28 transcription factor encoding genes representing 16 of 30 regions/cell-types of interest (Table <tblr tid="T5">5</tblr>). This information combined with identification of regulatory sequences within promoters of selected genes will aid the design of mini-promoters specific for each brain region. 
Because our selection of the 237 genes was biased towards those with known functions, we also carried out GO analysis on genes expressed in each of 18 SAGE libraries [see Additional file <supplr sid="S4">4</supplr>]. Specific neurological functions were less apparent among over-represented GO terms for these larger sets than for the 237 genes presented in this study.</p>
            <suppl id="S3">
               <title>
                  <p>Additional file 3</p>
               </title>
               <text>
                  <p>Top 12 over-represented GO terms in each ontology category among the 237 regionally enriched genes.</p>
               </text>
               <file name="1471-2202-9-66-S3.xls">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <suppl id="S4">
               <title>
                  <p>Additional file 4</p>
               </title>
               <text>
                  <p>Top 10 over-represented GO terms in each ontology category among the genes in each of 18 SAGE libraries.</p>
               </text>
               <file name="1471-2202-9-66-S4.xls">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <tbl id="T5">
               <title>
                  <p>Table 5</p>
               </title>
               <caption>
                  <p>Regionally enriched genes encoding transcription factors</p>
               </caption>
               <tblbdy cols="3">
                  <r>
                     <c ca="center">
                        <p>
                           <b>Gene</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Transcription Factor Description</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Associated Brain Region</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Nr2f2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Nuclear receptor subfamily 2, group F, member 2</p>
                     </c>
                     <c ca="center">
                        <p>Amygdala, Basolateral Complex</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Gbx1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Gastrulation brain homeobox 1</p>
                     </c>
                     <c ca="center">
                        <p>Basal Nucleus of Meynert</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Lhx8</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>LIM homeobox protein 8</p>
                     </c>
                     <c ca="center">
                        <p>Basal Nucleus of Meynert</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Esr1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Estrogen receptor 1</p>
                     </c>
                     <c ca="center">
                        <p>Brainstem (Pons and Medulla)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Pou4f1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>POU domain, class 4, transcription factor 1</p>
                     </c>
                     <c ca="center">
                        <p>Brainstem (Pons and Medulla)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Lhx1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>LIM homeobox protein 1</p>
                     </c>
                     <c ca="center">
                        <p>Cerebellum, Purkinje Cell Layer</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Emx1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Empty spiracles homeobox 1</p>
                     </c>
                     <c ca="center">
                        <p>Cortex</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Tbr1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>T-box brain gene 1</p>
                     </c>
                     <c ca="center">
                        <p>Cortex</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Egr1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Early growth response 1/Zinc finger protein 225</p>
                     </c>
                     <c ca="center">
                        <p>Cortex, Anterior Cingulate</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Nr4a2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Nuclear receptor subfamily 4, group A, member 2</p>
                     </c>
                     <c ca="center">
                        <p>Cortex, Insula</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Nr3c2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Nuclear receptor subfamily 3, group C, member 2</p>
                     </c>
                     <c ca="center">
                        <p>Hippocampus</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Neurod6</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Neurogenic differentiation 6; Basic HLH transcription factor</p>
                     </c>
                     <c ca="center">
                        <p>Hippocampus, Ammon's Horn</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Dlx1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Distal-less homeobox 1</p>
                     </c>
                     <c ca="center">
                        <p>Neurogenic</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Dlx2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Distal-less homeobox 2</p>
                     </c>
                     <c ca="center">
                        <p>Neurogenic</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Nr2e1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Nuclear receptor subfamily 2, group E, member 1</p>
                     </c>
                     <c ca="center">
                        <p>Neurogenic</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Sox2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>SRY (sex determining region Y)-box 2</p>
                     </c>
                     <c ca="center">
                        <p>Neurogenic</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Esr2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Estrogen receptor 2</p>
                     </c>
                     <c ca="center">
                        <p>Raphe Nuclei</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Foxp1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Forkhead box P1</p>
                     </c>
                     <c ca="center">
                        <p>Striatum</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Rarb</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Retinoic acid receptor, beta</p>
                     </c>
                     <c ca="center">
                        <p>Striatum</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Pitx3</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Paired-like homeodomain transcription factor 3</p>
                     </c>
                     <c ca="center">
                        <p>Substantia Nigra</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Lmx1b</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>LIM homeobox transcription factor 1, beta</p>
                     </c>
                     <c ca="center">
                        <p>Subthalamic Nucleus</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Pitx2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Paired-like homeodomain transcription factor 2</p>
                     </c>
                     <c ca="center">
                        <p>Subthalamic Nucleus</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Lef1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Lymphoid enhancer binding factor 1</p>
                     </c>
                     <c ca="center">
                        <p>Thalamus</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Tcf7l2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Transcription factor 7-like 2 (T-cell specific, HMG-box)</p>
                     </c>
                     <c ca="center">
                        <p>Thalamus</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Gcm1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Glial cells missing homolog 1</p>
                     </c>
                     <c ca="center">
                        <p>White Matter &#8211; Glia, Astrocytes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Gcm2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Glial cells missing homolog 2</p>
                     </c>
                     <c ca="center">
                        <p>White Matter &#8211; Glia, Astrocytes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Olig1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Oligodendrocyte transcription factor 1</p>
                     </c>
                     <c ca="center">
                        <p>White Matter &#8211; Glia, Oligodendroglia</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Olig2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>Oligodendrocyte transcription factor 2</p>
                     </c>
                     <c ca="center">
                        <p>White Matter &#8211; Glia, Oligodendroglia</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <it>Sox10</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>SRY (sex determining region Y)-box 10</p>
                     </c>
                     <c ca="center">
                        <p>White Matter &#8211; Glia, Oligodendroglia</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Discussion</p>
         </st>
         <p>Targeting gene therapy to specific regions of the brain requires the application of well-defined promoters that can drive expression in a region-specific manner. In this study our goal was to identify regionally enriched transcripts in sub-structures/cell-types of the mouse brain with a particular focus on those brain regions associated with diseases. We were encouraged by findings from the ABA project that above background level expression was found for ~80% of genes assayed &#8211; and approximately 70% of genes have been localized to fewer than 20% of all brain cells &#8211; suggesting that gene expression is clustered in small brain regions <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>. For a variety of reasons we believe that human orthologs of regionally enriched mouse genes would be good candidates to design promoters from. First, at the genomic level, approximately 99% of mouse genes have an ortholog in the human genome <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>. Second, it has been shown that 84% of human-mouse orthologous gene pairs show significantly lower expression divergence than that of random gene pairs <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>. In another comparable study within the milieu of neurogenomics, it was demonstrated that there are significant constraints on the evolution of gene expression and nucleotide sequence of region-specific genes in the brains of humans and mice <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. In general, transcripts that are regionally enriched in mice also appear to be regionally enriched in humans &#8211; further emphasizing conservation of mammalian brain gene expression. Nonetheless, we are exercising caution in assuming global conservation of expression across species as divergent as mouse and human, and will be testing multiple candidate genes for each region.</p>
         <p>Our study profiles region-enriched gene expression within 17 key areas of the adult mouse brain by LongSAGE analysis. For the small number of brain regions for which we had no SAGE data we interrogated the literature and the ABA directly. We used several expression indicators including SAGE tag abundance and specificity, <it>in situ </it>hybridization, promoter-reporter fusion data etc. to assess candidacy of genes. Our data mining strategy was to start with SAGE-identified genes ranked on the basis of specificity and expression level, confirmed with supporting evidence from the literature, ABA or GENSAT. Although we prioritized finding genes displaying absolute regional specificity (no detectable background expression), for our data mining strategy to be practicable we did not limit ourselves to this level of stringency &#8211; especially for the brain nuclei e.g. Basal Nucleus of Meynert, Barrington's Nucleus etc. Therefore, we also selected genes that displayed the highest level of regional enrichment with the idea that promoters of such genes can be manipulated to produce desired specificity of expression, as reported by Machon et al. for the mouse <it>Dach1 </it>gene <abbrgrp><abbr bid="B22">22</abbr></abbrgrp>. Compared to ubiquitous expression of the native <it>Dach1 </it>gene, a transgene with 5.8 kb of <it>Dach1 </it>regulatory sequence restricts &#946;-galactosidase reporter expression within the mouse brain to the neocortex. Deletion analysis of this 5.8 kb fragment further delimited cortex-specific activity to a minimal 2.5 kb promoter region. From a total of about 30,000 mouse genes <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>, we have identified a set of 237 genes displaying regional enrichment of expression.</p>
         <p>Analysis of SAGE data to delineate transcriptome similarity among 17 selected brain tissues revealed segregation of a large cluster of neuronal tissues from discrete single clusters of non-neuronal tissues (Ependymal tissue and the highly myelinated Cerebellar White Matter tissue) and the neuronal outlier Cerebellar Purkinje Cell Layer. This pattern of tissue clustering appears to be borne out by unique tissue composition at the very least. Among neuronal tissues, tight clustering of the Ventral and Medial Thalamus regions is possibly a reflection of common diencephalic origin, although from a functional standpoint the two tissues can be considered to be different. The expression signature of a tissue may either independently confer tissue uniqueness, or itself depend on unique tissue composition, the surrounding cellular environment, or a combination of factors.</p>
         <p>Other studies have also demonstrated the utility of gene expression patterns in assessing cytoarchitectural distinctness of rodent brain regions. During review of this manuscript another study was published that employed SAGE gene expression profiling to identify regional expression in 11 regions of the adult mouse brain <abbrgrp><abbr bid="B23">23</abbr></abbrgrp>. Interestingly, regional enrichment of some transcripts was found to be conserved in the human brain. Microarray analysis of gene expression patterns in 24 neural tissues in the mouse central nervous system has mapped discrete brain domains based on such expression patterns <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>. Importantly, it was revealed that embryological imprinting is still evident in the adult brain. Microarray analysis has similarly identified molecular markers for neuronal subtypes in the adult mouse forebrain <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>, in brain regions in each of eight strains of inbred mice <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>, as well as in the adult rat CNS <abbrgrp><abbr bid="B27">27</abbr><abbr bid="B28">28</abbr></abbrgrp>. Fang et al. have shown that the most regionally discriminative genes are associated with one of four specific factors: regional myelin/oligodendrocyte levels, resident neuron types, neurotransmitter innervation profiles, and Ca<sup>2+</sup>-dependent signaling and second messenger systems <abbrgrp><abbr bid="B28">28</abbr></abbrgrp>.</p>
         <p>By assessing over-representation of GO terms within our set of regionally expressed genes, we identified commonalities in molecular functions, cellular locations and involvement in key biological processes. This offers the promise of a unique set of molecular markers for each region/cell-type, and could potentially provide a mechanistic explanation of unique functions performed by discrete brain regions. Because of the disease application of our work, we were reassured by the over-representation of genes involved in neurotransmitter synthesis, reception and degradation. Importantly, we have also identified many regionally expressed transcription factor-encoding genes. This is consistent with previous findings of Suzuki et al. who have identified region-specific transcription factors in 11 mouse brain regions by using medium-scale real-time RT-PCR <abbrgrp><abbr bid="B29">29</abbr></abbrgrp>. They reported that 90% of known transcription factors display significant expression in at least one brain region. Additionally, it was found that 349 of over 1000 transcription factor and co-regulator genes, mapped by <it>in situ </it>hybridization in the brains of developing mice, show restricted expression patterns adequate to describe the anatomical organization of the mouse brain <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>.</p>
         <p>The identification of brain region-specific transcription factors is a prelude to explaining expression patterns of similarly enriched genes regulated by these factors. Armed with this knowledge, we can now search for evidence of transcription factor co-regulation of genes by availing of existing repositories of regulatory sequence collections <abbrgrp><abbr bid="B31">31</abbr><abbr bid="B32">32</abbr><abbr bid="B33">33</abbr></abbrgrp>. In particular, the PAZAR system <abbrgrp><abbr bid="B33">33</abbr></abbrgrp> has been employed to integrate transcription factor data and annotated regulatory sequences from the Pleiades Promoter Project. Additionally, given that much is already known about pathways that activate transcription factors, it would now be possible to identify pathways with which genes regulated by these transcription factors are associated. Indeed, a regulatory network comprising 15 important basic helix-loop-helix transcription factors and 153 target genes within the mouse brain has now been constructed <abbrgrp><abbr bid="B34">34</abbr></abbrgrp>. From the perspective of the Pleiades Promoter Project, the identification of DNA-binding elements, transcription factors and pathways influencing their interaction will stand in good stead for efficient mini-promoter design.</p>
         <p>We encountered challenges during this study that are deserving of mention. In literature mining, curation was obfuscated by the existence of numerous synonyms for either mouse or human genes, references to a single protein rather than two distinct isoforms, or different genes with the same synonym. Furthermore, where genes were not represented on either ABA or GENSAT it was not possible to confirm expression, but nonetheless such genes were retained based on level and specificity of expression indicated by the literature or SAGE. Additionally, for a good number of genes there was low correlation between expression detected by SAGE and <it>in situ </it>hybridization. Despite the depth of sampling, expression of many genes was not detected by our SAGE procedure; e.g. <it>Pde1b1</it>, which has been shown to be strongly expressed in the striatum by <it>in situ </it>hybridization on ABA and in the literature <abbrgrp><abbr bid="B35">35</abbr></abbrgrp>. Also, <it>Hcrt </it>appeared to be Hypothalamus-specific by SAGE but ABA indicated enrichment in the Hypothalamus with low level, widespread background expression. Although our SAGE procedure and ABA <it>in situ </it>hybridization profiled gene expression from the same mouse strain C57BL/6J, lack of correlation between the two could be due to inherent differences in the way RNA is processed and/or detected in these procedures. Nonetheless, <it>Hcrt </it>was retained in our study after considering significance of expression in SAGE analysis (<it>P </it>value = 0) and the description of minimal promoters in the literature <abbrgrp><abbr bid="B36">36</abbr><abbr bid="B37">37</abbr></abbrgrp>.</p>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>We have successfully identified genes displaying region-enriched expression in the mouse brain by the application of SAGE and data mining from a variety of publicly available sources. These genes represent useful molecular markers that could potentially aid in unraveling the functions of representative brain regions/cell-types. Importantly, for the Pleiades Promoter Project, identification of these genes has brought us closer to our goal of designing well-defined human promoters for gene therapy. Indeed, we have further identified promoters of human orthologs of a subset of these mouse genes, and are now gearing up to test expression of reporter genes in transgenic mice (unpublished data). Ultimately, it will be of great interest to determine for how many of these promoters the mouse pattern of regional enrichment is recapitulated within the human brain, and which of these successfully remediate the disorders they may be designed for.</p>
      </sec>
      <sec>
         <st>
            <p>Methods</p>
         </st>
         <sec>
            <st>
               <p>Mice</p>
            </st>
            <p>Mice used in our experiments were all adult male C57BL/6J mice (12-week old post-natal). All procedures used in these experiments were in accordance with the Canadian Council on Animal Care and approved by the University of British Columbia Animal Care Committee (A05-1748). All experiments were conducted in accordance with Canadian and International standards for animal care. All efforts were made to minimize the number and suffering of any animals used in these experiments.</p>
         </sec>
         <sec>
            <st>
               <p>Whole brain manual dissection and RNA extraction</p>
            </st>
            <p>Whole brains were manually dissected at room temperature from the intact bodies of mice. To minimize the effects of stress on gene expression, the mother, and the entire litter remained in the family cage until harvest. Mice were removed, one at a time and killed in a separate room, by cervical dislocation. Tissue was immediately flash frozen in liquid nitrogen and stored at -80&#176;C until further processing. Frozen tissue was disrupted and homogenized for 30 seconds with a Polytron<sup>&#174; </sup>PT 1200CL hand-held homogenizer (Kinematica AG, through Brinkmann&#8482; Instruments Inc, Mississauga, Canada) at a setting of 3 (~13,000 RPM), which had been equipped with a 7-mm easy-care generator (PT-DA 1207/2EC). Total RNA was extracted using RNeasy Lipid Tissue Mini Kit (Qiagen Inc., Mississauga, Canada), following the manufacturer's protocol with the modification of using 1.5-ml Phase Lock Gel&#8482; Heavy Tube (Eppendorf Scientific, through Fisher Scientific, Ottawa, Canada) for more robust phase separation. Also, while on the column, samples underwent DNase I treatment during RNA extraction. Standard care was used to avoid RNA degradation: reagents were prepared with diethyl pyrocarbonate (DEPC)-treated water and all surfaces and equipment were treated with an RNase decontamination solution (RNaseZap<sup>&#174; </sup>and RNaseZap<sup>&#174; </sup>Wipes; Ambion Inc., Austin, Texas, USA). The quality and quantity of the RNA samples were tested on an Agilent 2100 Bioanalyzer with the RNA 6000 Nano LabChip<sup>&#174; </sup>Kit (Agilent Technologies Canada Inc., Mississauga, Canada).</p>
         </sec>
         <sec>
            <st>
               <p>Harvesting adult brain regions by Laser Capture Microdissection (LCM)</p>
            </st>
            <p>Brains (1&#8211;3 per region; exception: 7 per Ependymal and Subependymal Layers), recovered as above, were immediately frozen on dry ice and mounted in OCT (Optimal Cutting Temperature) embedding medium. For the Visual Cortex (SM147), Cerebellar White Matter (SM182), Dorsal Striatum (SM195), and Cerebellar Purkinje cells (SM196) sagittal sections were processed, while coronal sections were used for the remaining tissues. Cryosections (20 &#956;m) of fresh-frozen tissues were mounted onto RNase-free membrane slides (Molecular Machines &amp; Industries AG (MMI), Glattbrugg, Switzerland) manufactured for LCM. To identify the desired regions for processing by LCM, each slide was individually stained with a modified Nissl-substance stain using cresyl violet (CV) dye (Polysciences, Inc., Warrington, PA) as follows: Slide-mounted sections were air-dried for 2&#8211;3 min and the surrounding OCT medium was rinsed off with 1&#215; PBS (made with DEPC water). Tissue was fixed for 30 sec with 75% ethanol, stained for 1 min with 0.5% CV, then sequentially rinsed for 5&#8211;10 sec with 75%, 95%, and 100% ethanol. After air-drying for 2&#8211;3 min, sections were immediately dissected with the SL &#956;CUT system (MMI AG; Glattbrugg, Switzerland) under the 10&#215; objective of a Nikon Eclipse TE2000-S, at laser power &lt; 70 mV, for no longer than 15 min. The cut regions were collected onto the adhesive cap of a 500-&#956;l microfuge tube (MMI AG, Glattbrugg, Switzerland) designed for the SL &#956;CUT system, digested with 30 &#956;l lysis buffer RLT (RNeasy Micro Kit; Qiagen Inc., Mississauga, Canada), and transferred from the cap to the vial. The samples were vortexed, centrifuged for 5 sec, and then stored at -80&#176;C until RNA extraction (as above). High-quality samples were pooled within groups for SAGE library generation.</p>
         </sec>
         <sec>
            <st>
               <p>SAGE library preparation</p>
            </st>
            <p>The LongSAGE-Lite method was used to construct the libraries as previously described <abbrgrp><abbr bid="B5">5</abbr></abbrgrp>. In brief, first strand cDNA was synthesized with Powerscript Reverse Transcriptase (Clontech, BD Biosciences, Mississauga, Canada) and LITE1/LITE TS primer mix (Invitrogen, Carlsbad, CA) using 15&#8211;120 ng of DNase-treated total RNA, and amplified by a 20-cycle PCR according to the SAGE-Lite method <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. SAGE-Lite biochemistry for the generation of full-length cDNA libraries is based upon the SMART (Switching Mechanism At the 5' end of RNA Transcripts) cDNA synthesis strategy (Clontech, BD Biosciences, Mississauga, Canada). Following amplification, the cDNA were processed according to an adaptation of the standard LongSAGE protocol using the I-SAGE Long kit (Invitrogen, Carlsbad, CA). The SAGE protocol includes steps of anchoring by <it>Nla</it>III, tagging by <it>Mme</it>I, and generating 131 bp ditags by T4 DNA ligase. The 131 bp ditags were amplified using the scale-up PCR varying from 23&#8211;27 cycles depending on the optimal scale up condition as described in the protocol, and were digested with <it>Nla</it>III to remove adapter sequences. Purified 36-bp ditags were ligated to form concatemers that were cloned into <it>Sph</it>I-digested pZErO-1 vector (Invitrogen, Carlsbad, CA), and transformations were done using One Shot DH10B T1 electrocompetent <it>E. coli </it>(Invitrogen, Carlsbad, CA).</p>
            <p>After transformants had been screened by colony PCR, the fraction containing concatemers of sizes ranging from 900 bp-1300 bp was chosen for sequencing. Colonies were picked using a Q-Pix robot (Genetix, Beaverton, OR) and inoculated into 2xYT media with Zeocin (50 &#956;g/ml) and glycerol (7.5%). After overnight culture, glycerol stocks were used to inoculate larger volume cultures for plasmid preparation, carried out using a standard alkaline-lysis procedure adapted for high-throughput processing with microtiter plates. DNA sequencing was performed with BigDye v3.1 dye terminator cycle sequencing reactions run on Tetrad thermal cyclers (MJ Research, Waltham, MA). Products from the sequencing reaction were purified by ethanol precipitation and then run on capillary DNA sequencers (Model 3730xl, Applied Biosystems, Foster City, CA).</p>
            <p>Following inspection of data quality from a first 384-well sequencing plate, each library was sequenced to a depth of > 100,000 raw tags. The resulting sequence data were collected automatically and processed by both trimming the reads for sequence quality and removing sequences from non-recombinant clones, vector DNA and linker-derived tags. Processed data can be found on the Mouse Atlas website (please see Availability &amp; requirements for more information).</p>
         </sec>
         <sec>
            <st>
               <p>SAGE data analysis</p>
            </st>
            <p>To obtain high quality SAGE tags for this study, all raw SAGE tags underwent a three-step cluster modification process developed by Siddiqui et al. <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>. In the first step, we calculated for each tag a <it>P </it>value based on the <it>Phred </it>quality score <abbrgrp><abbr bid="B39">39</abbr></abbrgrp> to identify single nucleotide variants likely to originate from sequencing error. In the second step, we used tag sequence clustering to group such variants to combine tags likely to originate from a common transcript. Thus, some singletons were clustered and counted as a more abundant tag. The third step was to filter out low quality tags and compare each <it>P </it>value to a meta-library <it>P </it>value calculated from all SAGE libraries. Tag-to-gene-mapping was then carried out using the DiscoverySpace 4.0 application <abbrgrp><abbr bid="B40">40</abbr></abbrgrp>. All cluster-modified tags were then mapped to transcripts in the NCBI Reference Sequence Collection <abbrgrp><abbr bid="B41">41</abbr></abbrgrp>. The remaining unmapped tags were mapped to transcripts in the Mammalian Gene Collection <abbrgrp><abbr bid="B42">42</abbr></abbrgrp>, followed by the Ensembl database <abbrgrp><abbr bid="B43">43</abbr></abbrgrp>. Only sense transcripts and unique mappings were considered, and tags that mapped to more than one transcript in any of the three transcript databases were discarded. The three mapping results were subsequently merged based on gene symbol.</p>
            <p>For each gene, a <it>P </it>value was assigned to each target (TL; brain region of interest) and off-target (OTL; background region) library pair using the <it>P </it>value option in DiscoverySpace. The <it>P </it>value was computed based on Audic-Claverie algorithms <abbrgrp><abbr bid="B44">44</abbr></abbrgrp> to assess confidence level of differential expression between two transcript libraries. A ranking system was implemented to facilitate selection of candidate genes with specific or enriched expression in each target library (Table <tblr tid="T2">2</tblr>). Region-specific transcripts were obtained by selecting transcripts detected with 5 tags or more only in one target library. To identify region-enriched transcripts, those detected in one target library and one off-target library (<it>P</it><sub><it>TL</it>-<it>OTL </it></sub>value &#8804; 0.05) were selected. Transcripts detected in multiple libraries were ranked based on pre-defined <it>P </it>value limits of differential expression (<it>P</it><sub><it>TL</it>-<it>TL</it></sub>, <it>P</it><sub><it>TL</it>-<it>OTL</it></sub>), as well as additional criteria such as target and off-target library counts. Transcripts whose expression patterns did not fit these criteria were not ranked.</p>
            <p>To analyze transcriptome similarity of tissues, a dendrogram was generated using MATLAB 7 (The MathWorks, Natick, MA) based on hierarchical clustering using the Unweighted Pair Group Method with Arithmetic Mean (UPGMA). The input data is a list of objects (tissue SAGE libraries) with their pair-wise distances (expression divergence ED; see below), and the output is a dendrogram. Initially, each object is in its own cluster; then, at each step of the hierarchical clustering the nearest two clusters are combined into a higher-level cluster. The distance between any two clusters A and B is taken to be the average of all distances between pairs of objects in A and B. Thus, we defined pair-wise distance or expression divergence (ED) between any two tissues as the fraction of differentially expressed genes in their corresponding SAGE libraries, using the formula:</p>
            <p>
               <display-formula>ED<sub>(<it>p</it>) </sub>= N<sub>diff(<it>p</it>)</sub>/N</display-formula>
            </p>
            <p>(N<sub>diff(<it>p</it>) </sub>= number of differentially expressed genes for a given <it>P </it>value, N = number of shared genes between two corresponding libraries).</p>
         </sec>
         <sec>
            <st>
               <p>Semi-automated literature mining</p>
            </st>
            <p>All synonyms for 28,000 mouse genes were obtained from Entrez (RefSeq release 14) combined with Ensembl (build 34) of the mouse genome. Synonyms for the human orthologs were obtained using Compara (Ensembl build 34) to identify similarities between human and mouse together with Homologene (version 47) for homolog detection. In each case, Ensembl and Entrez were used as cross-references for gene identifiers. From these search strings, all names found in the English dictionary were subtracted to remove obfuscating gene terms such as "Ice". Abstracts were parsed from Medline (extraction performed September 7, 2006) and the complete text of articles was parsed from PubMed Central <abbrgrp><abbr bid="B45">45</abbr></abbrgrp>, and converted into individual sentences using the medical sentence parser <abbrgrp><abbr bid="B46">46</abbr></abbrgrp>. Each sentence was searched for the co-occurrence of gene names with brain regions of interest. For each brain region, expanded search terms were applied referring to finer structures appropriate to the region as defined by the ontology available from the Allen Brain Atlas website <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>. The number of sentences with gene names and brain regions obtained is greater than the number of sentences with only brain regions because of the plural nature of both search terms. We scrutinized retrieved publications for details indicating regionally enriched/specific expression in a brain region.</p>
         </sec>
         <sec>
            <st>
               <p>Gene Ontology over-representation analysis</p>
            </st>
            <p>Gene Ontology <abbrgrp><abbr bid="B19">19</abbr></abbrgrp> over-representation analysis was performed for the 237 genes using the BiNGO <abbrgrp><abbr bid="B47">47</abbr></abbrgrp> plug-in for the Cytoscape <abbrgrp><abbr bid="B48">48</abbr></abbrgrp> software package. Significance of over-representation of GO terms was calculated using the hypergeometric test, corrected for multiple testing with a Benjamini &amp; Hochberg false discovery rate correction <abbrgrp><abbr bid="B49">49</abbr></abbrgrp>, and a cut-off of 0.05 was applied to the result. The test selection of 237 genes was compared to all GO annotated genes in the mouse genome (18535 genes, as of March 18, 2008).</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Abbreviations</p>
         </st>
         <p>SAGE: Serial Analysis of Gene Expression; LCM: Laser Capture Microdissection; OCT: Optimal Cutting Temperature; CV: Cresyl violet; DEPC: Diethyl Pyrocarbonate; ABA: Allen Brain Atlas; BAC: Bacterial Artificial Chromosome; GENSAT: Gene Expression Nervous System Atlas; UPGMA: Unweighted Pair Group Method with Arithmetic Mean; ED: Expression Divergence; GO: Gene Ontology.</p>
      </sec>
      <sec>
         <st>
            <p>Availability &amp; requirements</p>
         </st>
         <p>The Pleiades Promoter Project: <url>http://www.pleiades.org</url></p>
         <p>ABA website: <url>http://www.brain-map.org</url>; Seattle (WA): Allen Institute for Brain Science <sup>&#169; </sup>2004&#8211;2007; in accordance with ABA Terms of Use and Citation Policy.</p>
         <p>Mouse Atlas website: <url>http://www.mouseatlas.org/data/supplemental/brain_tags_processed</url></p>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>CAD analyzed SAGE data, ABA <it>in situ </it>hybridization data and mined the PubMed database to identify region-enriched genes, carried out GO analysis, and drafted this manuscript. VC analyzed SAGE data, ABA <it>in situ </it>hybridization data, mined the PubMed database to identify region-enriched genes, and contributed to the compilation of gene expression summaries in Additional file <supplr sid="S2">2</supplr>. DG confirmed candidature of SAGE and literature mined genes by inspecting ABA images. RV and LLCL performed bioinformatics analysis of SAGE data. Y&#8211;YX and SB laser-microdissected tissues for construction of SAGE libraries. YZ participated in SAGE library construction. MB did the hierarchical clustering analysis of tissue transcriptomes utilizing the java script written by AH. EP&#8211;C participated in data mining and selection of region-enriched genes. EMS conceived of the study, and participated in its design and coordination along with WWW, DG, MAM, RAH, and SJMJ. All authors read and approved the final manuscript.</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>We wish to acknowledge financial support from the BC Cancer Foundation, Genome British Columbia, Genome Canada, UBC Institute of Mental Health, Child and Family Research Institute, UBC Office of the Vice President Research, BC Mental Health and Addiction Services, GlaxoSmithKline R &amp; D Ltd., and Canada Research Chair in Genetics and Behaviour (to E.M.S.). We are grateful to the SAGE Library Construction Group and the Sequencing Group at the Genome Sciences Centre for technical assistance. We would like to thank Charles De Leeuw for useful comments on this manuscript, and Tracey Weir and Russell Watkins for editorial assistance with the manuscript. S.J.M.J., R.A.H., W.W.W. and M.A.M. are Michael Smith Foundation for Health Research Scholars. W.W.W. is also a CIHR New Investigator.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Conservation of regional gene expression in mouse and human brain</p>
            </title>
            <aug>
               <au>
                  <snm>Strand</snm>
                  <fnm>AD</fnm>
               </au>
               <au>
                  <snm>Aragaki</snm>
                  <fnm>AK</fnm>
               </au>
               <au>
                  <snm>Baquet</snm>
                  <fnm>ZC</fnm>
               </au>
               <au>
                  <snm>Hodges</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Cunningham</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Holmans</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>KR</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Kooperberg</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Olson</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>PLoS genetics</source>
            <pubdate>2007</pubdate>
            <volume>3</volume>
            <issue>4</issue>
            <fpage>e59</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1853119</pubid>
                  <pubid idtype="pmpid" link="fulltext">17447843</pubid>
                  <pubid idtype="doi">10.1371/journal.pgen.0030059</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>Human-mouse genome comparisons to locate regulatory sites</p>
            </title>
            <aug>
               <au>
                  <snm>Wasserman</snm>
                  <fnm>WW</fnm>
               </au>
               <au>
                  <snm>Palumbo</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Thompson</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Fickett</snm>
                  <fnm>JW</fnm>
               </au>
               <au>
                  <snm>Lawrence</snm>
                  <fnm>CE</fnm>
               </au>
            </aug>
            <source>Nature genetics</source>
            <pubdate>2000</pubdate>
            <volume>26</volume>
            <issue>2</issue>
            <fpage>225</fpage>
            <lpage>228</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/79965</pubid>
                  <pubid idtype="pmpid" link="fulltext">11017083</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Somatodendritic localization and hyperphosphorylation of tau protein in transgenic mice expressing the longest human brain tau isoform</p>
            </title>
            <aug>
               <au>
                  <snm>Gotz</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Probst</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Spillantini</snm>
                  <fnm>MG</fnm>
               </au>
               <au>
                  <snm>Schafer</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Jakes</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Burki</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Goedert</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Embo J</source>
            <pubdate>1995</pubdate>
            <volume>14</volume>
            <issue>7</issue>
            <fpage>1304</fpage>
            <lpage>1313</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">398215</pubid>
                  <pubid idtype="pmpid">7729409</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <title>
               <p>Serial analysis of gene expression</p>
            </title>
            <aug>
               <au>
                  <snm>Velculescu</snm>
                  <fnm>VE</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Vogelstein</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Kinzler</snm>
                  <fnm>KW</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>1995</pubdate>
            <volume>270</volume>
            <issue>5235</issue>
            <fpage>484</fpage>
            <lpage>487</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.270.5235.484</pubid>
                  <pubid idtype="pmpid" link="fulltext">7570003</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Large-scale production of SAGE libraries from microdissected tissues, flow-sorted cells, and cell lines</p>
            </title>
            <aug>
               <au>
                  <snm>Khattra</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Delaney</snm>
                  <fnm>AD</fnm>
               </au>
               <au>
                  <snm>Zhao</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Siddiqui</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Asano</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>McDonald</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Pandoh</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Dhalla</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Prabhu</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Ma</snm>
                  <fnm>K</fnm>
               </au>
               <etal/>
            </aug>
            <source>Genome research</source>
            <pubdate>2007</pubdate>
            <volume>17</volume>
            <issue>1</issue>
            <fpage>108</fpage>
            <lpage>116</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1716260</pubid>
                  <pubid idtype="pmpid" link="fulltext">17135571</pubid>
                  <pubid idtype="doi">10.1101/gr.5488207</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Using the transcriptome to annotate the genome</p>
            </title>
            <aug>
               <au>
                  <snm>Saha</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Sparks</snm>
                  <fnm>AB</fnm>
               </au>
               <au>
                  <snm>Rago</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Akmaev</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>CJ</fnm>
               </au>
               <au>
                  <snm>Vogelstein</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Kinzler</snm>
                  <fnm>KW</fnm>
               </au>
               <au>
                  <snm>Velculescu</snm>
                  <fnm>VE</fnm>
               </au>
            </aug>
            <source>Nat Biotechnol</source>
            <pubdate>2002</pubdate>
            <volume>20</volume>
            <issue>5</issue>
            <fpage>508</fpage>
            <lpage>512</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nbt0502-508</pubid>
                  <pubid idtype="pmpid" link="fulltext">11981567</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>The Mouse Atlas of Gene Expression Project</p>
            </title>
            <url>http://www.mouseatlas.org</url>
         </bibl>
         <bibl id="B8">
            <title>
               <p>A mouse atlas of gene expression: large-scale digital gene-expression profiles from precisely defined developing C57BL/6J mouse tissues and cells</p>
            </title>
            <aug>
               <au>
                  <snm>Siddiqui</snm>
                  <fnm>AS</fnm>
               </au>
               <au>
                  <snm>Khattra</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Delaney</snm>
                  <fnm>AD</fnm>
               </au>
               <au>
                  <snm>Zhao</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Astell</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Asano</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Babakaiff</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Barber</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Beland</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Bohacec</snm>
                  <fnm>S</fnm>
               </au>
               <etal/>
            </aug>
            <source>Proceedings of the National Academy of Sciences of the United States of America</source>
            <pubdate>2005</pubdate>
            <volume>102</volume>
            <issue>51</issue>
            <fpage>18485</fpage>
            <lpage>18490</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1311911</pubid>
                  <pubid idtype="pmpid" link="fulltext">16352711</pubid>
                  <pubid idtype="doi">10.1073/pnas.0509455102</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>The Pleiades Promoter Project</p>
            </title>
            <url>http://www.pleiades.org/</url>
         </bibl>
         <bibl id="B10">
            <title>
               <p>The NCBI PubMed Database</p>
            </title>
            <url>http://www.pubmed.com</url>
         </bibl>
         <bibl id="B11">
            <title>
               <p>Getting to the (c)ore of knowledge: mining biomedical literature</p>
            </title>
            <aug>
               <au>
                  <snm>De Bruijn</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Martin</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Int J Med Inform</source>
            <pubdate>2002</pubdate>
            <volume>67</volume>
            <issue>1&#8211;3</issue>
            <fpage>7</fpage>
            <lpage>18</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S1386-5056(02)00050-3</pubid>
                  <pubid idtype="pmpid" link="fulltext">12460628</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>The next generation of literature analysis: integration of genomic analysis into text mining</p>
            </title>
            <aug>
               <au>
                  <snm>Scherf</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Epple</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Werner</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Brief Bioinform</source>
            <pubdate>2005</pubdate>
            <volume>6</volume>
            <issue>3</issue>
            <fpage>287</fpage>
            <lpage>297</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bib/6.3.287</pubid>
                  <pubid idtype="pmpid" link="fulltext">16212776</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>The Allen Brain Atlas Database</p>
            </title>
            <url>http://www.allenbrainatlas.org/</url>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Genome-wide atlas of gene expression in the adult mouse brain</p>
            </title>
            <aug>
               <au>
                  <snm>Lein</snm>
                  <fnm>ES</fnm>
               </au>
               <au>
                  <snm>Hawrylycz</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Ao</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Ayres</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Bensinger</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Bernard</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Boe</snm>
                  <fnm>AF</fnm>
               </au>
               <au>
                  <snm>Boguski</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Brockway</snm>
                  <fnm>KS</fnm>
               </au>
               <au>
                  <snm>Byrnes</snm>
                  <fnm>EJ</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nature</source>
            <pubdate>2007</pubdate>
            <volume>445</volume>
            <issue>7124</issue>
            <fpage>168</fpage>
            <lpage>176</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature05453</pubid>
                  <pubid idtype="pmpid" link="fulltext">17151600</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p>Allen Brain Atlas maps 21,000 genes of the mouse brain</p>
            </title>
            <aug>
               <au>
                  <snm>McCarthy</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Lancet Neurol</source>
            <pubdate>2006</pubdate>
            <volume>5</volume>
            <issue>11</issue>
            <fpage>907</fpage>
            <lpage>908</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S1474-4422(06)70594-4</pubid>
                  <pubid idtype="pmpid">17086647</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>Laser-capture microdissection: opening the microscopic frontier to molecular analysis</p>
            </title>
            <aug>
               <au>
                  <snm>Simone</snm>
                  <fnm>NL</fnm>
               </au>
               <au>
                  <snm>Bonner</snm>
                  <fnm>RF</fnm>
               </au>
               <au>
                  <snm>Gillespie</snm>
                  <fnm>JW</fnm>
               </au>
               <au>
                  <snm>Emmert-Buck</snm>
                  <fnm>MR</fnm>
               </au>
               <au>
                  <snm>Liotta</snm>
                  <fnm>LA</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>1998</pubdate>
            <volume>14</volume>
            <issue>7</issue>
            <fpage>272</fpage>
            <lpage>276</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0168-9525(98)01489-9</pubid>
                  <pubid idtype="pmpid" link="fulltext">9676529</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>Early events in the histo- and cytogenesis of the vertebrate CNS</p>
            </title>
            <aug>
               <au>
                  <snm>Nakai</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Fujita</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>The International journal of developmental biology</source>
            <pubdate>1994</pubdate>
            <volume>38</volume>
            <issue>2</issue>
            <fpage>175</fpage>
            <lpage>183</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">7981027</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>The GENSAT Database</p>
            </title>
            <url>http://www.gensat.org</url>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Gene ontology: tool for the unification of biology. The Gene Ontology Consortium</p>
            </title>
            <aug>
               <au>
                  <snm>Ashburner</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Ball</snm>
                  <fnm>CA</fnm>
               </au>
               <au>
                  <snm>Blake</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Botstein</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Butler</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Cherry</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Davis</snm>
                  <fnm>AP</fnm>
               </au>
               <au>
                  <snm>Dolinski</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Dwight</snm>
                  <fnm>SS</fnm>
               </au>
               <au>
                  <snm>Eppig</snm>
                  <fnm>JT</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nature genetics</source>
            <pubdate>2000</pubdate>
            <volume>25</volume>
            <issue>1</issue>
            <fpage>25</fpage>
            <lpage>29</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/75556</pubid>
                  <pubid idtype="pmpid" link="fulltext">10802651</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>Initial sequencing and comparative analysis of the mouse genome</p>
            </title>
            <aug>
               <au>
                  <snm>Waterston</snm>
                  <fnm>RH</fnm>
               </au>
               <au>
                  <snm>Lindblad-Toh</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Birney</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Rogers</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Abril</snm>
                  <fnm>JF</fnm>
               </au>
               <au>
                  <snm>Agarwal</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Agarwala</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Ainscough</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Alexandersson</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>An</snm>
                  <fnm>P</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nature</source>
            <pubdate>2002</pubdate>
            <volume>420</volume>
            <issue>6915</issue>
            <fpage>520</fpage>
            <lpage>562</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature01262</pubid>
                  <pubid idtype="pmpid" link="fulltext">12466850</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>Evolutionary conservation of expression profiles between human and mouse orthologous genes</p>
            </title>
            <aug>
               <au>
                  <snm>Liao</snm>
                  <fnm>BY</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Molecular biology and evolution</source>
            <pubdate>2006</pubdate>
            <volume>23</volume>
            <issue>3</issue>
            <fpage>530</fpage>
            <lpage>540</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1093/molbev/msj054</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Forebrain-specific promoter/enhancer D6 derived from the mouse Dach1 gene controls expression in neural stem cells</p>
            </title>
            <aug>
               <au>
                  <snm>Machon</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Bout</snm>
                  <mnm>van den</mnm>
                  <fnm>CJ</fnm>
               </au>
               <au>
                  <snm>Backman</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Rosok</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Caubit</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Fromm</snm>
                  <fnm>SH</fnm>
               </au>
               <au>
                  <snm>Geronimo</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Krauss</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Neuroscience</source>
            <pubdate>2002</pubdate>
            <volume>112</volume>
            <issue>4</issue>
            <fpage>951</fpage>
            <lpage>966</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0306-4522(02)00053-2</pubid>
                  <pubid idtype="pmpid" link="fulltext">12088753</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B23">
            <title>
               <p>Quantitative gene expression profiling of mouse brain regions reveals differential transcripts conserved in human and affected in disease models</p>
            </title>
            <aug>
               <au>
                  <snm>Brochier</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Gaillard</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Diguet</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Caudy</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Dossat</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Segurens</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Wincker</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Roze</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Caboche</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Hantraye</snm>
                  <fnm>P</fnm>
               </au>
               <etal/>
            </aug>
            <source>Physiological genomics</source>
            <pubdate>2008</pubdate>
            <volume>33</volume>
            <issue>2</issue>
            <fpage>170</fpage>
            <lpage>179</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1152/physiolgenomics.00125.2007</pubid>
                  <pubid idtype="pmpid" link="fulltext">18252803</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Adult mouse brain gene expression patterns bear an embryologic imprint</p>
            </title>
            <aug>
               <au>
                  <snm>Zapala</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Hovatta</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Ellison</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Wodicka</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Del Rio</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Tennant</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Tynan</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Broide</snm>
                  <fnm>RS</fnm>
               </au>
               <au>
                  <snm>Helton</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Stoveken</snm>
                  <fnm>BS</fnm>
               </au>
               <etal/>
            </aug>
            <source>Proceedings of the National Academy of Sciences of the United States of America</source>
            <pubdate>2005</pubdate>
            <volume>102</volume>
            <issue>29</issue>
            <fpage>10357</fpage>
            <lpage>10362</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1173363</pubid>
                  <pubid idtype="pmpid" link="fulltext">16002470</pubid>
                  <pubid idtype="doi">10.1073/pnas.0503357102</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>Molecular taxonomy of major neuronal classes in the adult mouse forebrain</p>
            </title>
            <aug>
               <au>
                  <snm>Sugino</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Hempel</snm>
                  <fnm>CM</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>MN</fnm>
               </au>
               <au>
                  <snm>Hattox</snm>
                  <fnm>AM</fnm>
               </au>
               <au>
                  <snm>Shapiro</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Wu</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Huang</snm>
                  <fnm>ZJ</fnm>
               </au>
               <au>
                  <snm>Nelson</snm>
                  <fnm>SB</fnm>
               </au>
            </aug>
            <source>Nat Neurosci</source>
            <pubdate>2006</pubdate>
            <volume>9</volume>
            <issue>1</issue>
            <fpage>99</fpage>
            <lpage>107</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nn1618</pubid>
                  <pubid idtype="pmpid" link="fulltext">16369481</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>Combined application of behavior genetics and microarray analysis to identify regional expression themes and gene-behavior associations</p>
            </title>
            <aug>
               <au>
                  <snm>Letwin</snm>
                  <fnm>NE</fnm>
               </au>
               <au>
                  <snm>Kafkafi</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Benjamini</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Mayo</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Frank</snm>
                  <fnm>BC</fnm>
               </au>
               <au>
                  <snm>Luu</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>NH</fnm>
               </au>
               <au>
                  <snm>Elmer</snm>
                  <fnm>GI</fnm>
               </au>
            </aug>
            <source>J Neurosci</source>
            <pubdate>2006</pubdate>
            <volume>26</volume>
            <issue>20</issue>
            <fpage>5277</fpage>
            <lpage>5287</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1523/JNEUROSCI.4602-05.2006</pubid>
                  <pubid idtype="pmpid" link="fulltext">16707780</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>Gene expression profiles in rat brain disclose CNS signature genes and regional patterns of functional specialisation</p>
            </title>
            <aug>
               <au>
                  <snm>Stansberg</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Vik-Mo</snm>
                  <fnm>AO</fnm>
               </au>
               <au>
                  <snm>Holdhus</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Breilid</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Srebro</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Petersen</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Jorgensen</snm>
                  <fnm>HA</fnm>
               </au>
               <au>
                  <snm>Jonassen</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Steen</snm>
                  <fnm>VM</fnm>
               </au>
            </aug>
            <source>BMC genomics</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <fpage>94</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1853090</pubid>
                  <pubid idtype="pmpid" link="fulltext">17408481</pubid>
                  <pubid idtype="doi">10.1186/1471-2164-8-94</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Classification of cDNA array genes that have a highly significant discriminative power due to their unique distribution in four brain regions</p>
            </title>
            <aug>
               <au>
                  <snm>Fang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Tong</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Shi</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Jakab</snm>
                  <fnm>RL</fnm>
               </au>
               <au>
                  <snm>Bowyer</snm>
                  <fnm>JF</fnm>
               </au>
            </aug>
            <source>DNA and cell biology</source>
            <pubdate>2004</pubdate>
            <volume>23</volume>
            <issue>10</issue>
            <fpage>661</fpage>
            <lpage>674</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1089/dna.2004.23.661</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>Identification of region-specific transcription factor genes in the adult mouse brain by medium-scale real-time RT-PCR</p>
            </title>
            <aug>
               <au>
                  <snm>Suzuki</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Okunishi</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Hashizume</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Katayama</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Ninomiya</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Osato</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Sato</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Nakamura</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Iida</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kanamori</snm>
                  <fnm>M</fnm>
               </au>
               <etal/>
            </aug>
            <source>FEBS letters</source>
            <pubdate>2004</pubdate>
            <volume>573</volume>
            <issue>1&#8211;3</issue>
            <fpage>214</fpage>
            <lpage>218</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.febslet.2004.07.068</pubid>
                  <pubid idtype="pmpid" link="fulltext">15328000</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>Mouse brain organization revealed through direct genome-scale TF expression analysis</p>
            </title>
            <aug>
               <au>
                  <snm>Gray</snm>
                  <fnm>PA</fnm>
               </au>
               <au>
                  <snm>Fu</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Luo</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Zhao</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Yu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ferrari</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Tenzen</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Yuk</snm>
                  <fnm>DI</fnm>
               </au>
               <au>
                  <snm>Tsung</snm>
                  <fnm>EF</fnm>
               </au>
               <au>
                  <snm>Cai</snm>
                  <fnm>Z</fnm>
               </au>
               <etal/>
            </aug>
            <source>Science</source>
            <pubdate>2004</pubdate>
            <volume>306</volume>
            <issue>5705</issue>
            <fpage>2255</fpage>
            <lpage>2257</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1104935</pubid>
                  <pubid idtype="pmpid" link="fulltext">15618518</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>Constrained binding site diversity within families of transcription factors enhances pattern discovery bioinformatics</p>
            </title>
            <aug>
               <au>
                  <snm>Sandelin</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Wasserman</snm>
                  <fnm>WW</fnm>
               </au>
            </aug>
            <source>Journal of molecular biology</source>
            <pubdate>2004</pubdate>
            <volume>338</volume>
            <issue>2</issue>
            <fpage>207</fpage>
            <lpage>215</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.jmb.2004.02.048</pubid>
                  <pubid idtype="pmpid" link="fulltext">15066426</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>ORegAnno: an open access database and curation system for literature-derived promoters, transcription factor binding sites and regulatory variation</p>
            </title>
            <aug>
               <au>
                  <snm>Montgomery</snm>
                  <fnm>SB</fnm>
               </au>
               <au>
                  <snm>Griffith</snm>
                  <fnm>OL</fnm>
               </au>
               <au>
                  <snm>Sleumer</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Bergman</snm>
                  <fnm>CM</fnm>
               </au>
               <au>
                  <snm>Bilenky</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Pleasance</snm>
                  <fnm>ED</fnm>
               </au>
               <au>
                  <snm>Prychyna</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>SJ</fnm>
               </au>
            </aug>
            <source>Bioinformatics (Oxford, England)</source>
            <pubdate>2006</pubdate>
            <volume>22</volume>
            <issue>5</issue>
            <fpage>637</fpage>
            <lpage>640</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/btk027</pubid>
                  <pubid idtype="pmpid" link="fulltext">16397004</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>PAZAR: a framework for collection and dissemination of cis-regulatory sequence annotation</p>
            </title>
            <aug>
               <au>
                  <snm>Portales-Casamar</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Kirov</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Lim</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lithwick</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Swanson</snm>
                  <fnm>MI</fnm>
               </au>
               <au>
                  <snm>Ticoll</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Snoddy</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wasserman</snm>
                  <fnm>WW</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <issue>10</issue>
            <fpage>R207</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2246282</pubid>
                  <pubid idtype="pmpid" link="fulltext">17916232</pubid>
                  <pubid idtype="doi">10.1186/gb-2007-8-10-r207</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B34">
            <title>
               <p>Regulatory module network of basic/helix-loop-helix transcription factors in mouse brain</p>
            </title>
            <aug>
               <au>
                  <snm>Li</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>ZJ</fnm>
               </au>
               <au>
                  <snm>Pan</snm>
                  <fnm>YC</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Fu</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Cooper</snm>
                  <fnm>NG</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>YX</fnm>
               </au>
               <au>
                  <snm>Qiu</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Shi</snm>
                  <fnm>TL</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <issue>11</issue>
            <fpage>R244</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2258200</pubid>
                  <pubid idtype="pmpid" link="fulltext">18021424</pubid>
                  <pubid idtype="doi">10.1186/gb-2007-8-11-r244</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>Expression of a calmodulin-dependent phosphodiesterase isoform (PDE1B1) correlates with brain regions having extensive dopaminergic innervation</p>
            </title>
            <aug>
               <au>
                  <snm>Polli</snm>
                  <fnm>JW</fnm>
               </au>
               <au>
                  <snm>Kincaid</snm>
                  <fnm>RL</fnm>
               </au>
            </aug>
            <source>J Neurosci</source>
            <pubdate>1994</pubdate>
            <volume>14</volume>
            <issue>3 Pt 1</issue>
            <fpage>1251</fpage>
            <lpage>1261</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">8120623</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B36">
            <title>
               <p>Structure and function of human prepro-orexin gene</p>
            </title>
            <aug>
               <au>
                  <snm>Sakurai</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Moriguchi</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Furuya</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Kajiwara</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Nakamura</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Yanagisawa</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Goto</snm>
                  <fnm>K</fnm>
               </au>
            </aug>
            <source>The Journal of biological chemistry</source>
            <pubdate>1999</pubdate>
            <volume>274</volume>
            <issue>25</issue>
            <fpage>17771</fpage>
            <lpage>17776</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1074/jbc.274.25.17771</pubid>
                  <pubid idtype="pmpid" link="fulltext">10364220</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B37">
            <title>
               <p>Modulation of the promoter region of prepro-hypocretin by alpha-interferon</p>
            </title>
            <aug>
               <au>
                  <snm>Waleh</snm>
                  <fnm>NS</fnm>
               </au>
               <au>
                  <snm>Apte-Deshpande</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Terao</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Ding</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kilduff</snm>
                  <fnm>TS</fnm>
               </au>
            </aug>
            <source>Gene</source>
            <pubdate>2001</pubdate>
            <volume>262</volume>
            <issue>1&#8211;2</issue>
            <fpage>123</fpage>
            <lpage>128</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0378-1119(00)00544-8</pubid>
                  <pubid idtype="pmpid" link="fulltext">11179675</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <title>
               <p>Comprehensive transcript analysis in small quantities of mRNA by SAGE-lite</p>
            </title>
            <aug>
               <au>
                  <snm>Peters</snm>
                  <fnm>DG</fnm>
               </au>
               <au>
                  <snm>Kassam</snm>
                  <fnm>AB</fnm>
               </au>
               <au>
                  <snm>Yonas</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>O'Hare</snm>
                  <fnm>EH</fnm>
               </au>
               <au>
                  <snm>Ferrell</snm>
                  <fnm>RE</fnm>
               </au>
               <au>
                  <snm>Brufsky</snm>
                  <fnm>AM</fnm>
               </au>
            </aug>
            <source>Nucleic acids research</source>
            <pubdate>1999</pubdate>
            <volume>27</volume>
            <issue>24</issue>
            <fpage>e39</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">148762</pubid>
                  <pubid idtype="pmpid" link="fulltext">10572191</pubid>
                  <pubid idtype="doi">10.1093/nar/27.24.e39</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B39">
            <title>
               <p>Base-calling of automated sequencer traces using phred. II. Error probabilities</p>
            </title>
            <aug>
               <au>
                  <snm>Ewing</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Genome research</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <issue>3</issue>
            <fpage>186</fpage>
            <lpage>194</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9521922</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B40">
            <title>
               <p>DiscoverySpace: an interactive data analysis application</p>
            </title>
            <aug>
               <au>
                  <snm>Robertson</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Oveisi-Fordorei</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Zuyderduyn</snm>
                  <fnm>SD</fnm>
               </au>
               <au>
                  <snm>Varhol</snm>
                  <fnm>RJ</fnm>
               </au>
               <au>
                  <snm>Fjell</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Marra</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Siddiqui</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <issue>1</issue>
            <fpage>R6</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1839122</pubid>
                  <pubid idtype="pmpid" link="fulltext">17210078</pubid>
                  <pubid idtype="doi">10.1186/gb-2007-8-1-r6</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B41">
            <title>
               <p>The NCBI Reference Sequence Collection</p>
            </title>
            <url>http://www.ncbi.nlm.nih.gov/RefSeq</url>
         </bibl>
         <bibl id="B42">
            <title>
               <p>The Mammalian Gene Collection</p>
            </title>
            <url>http://mgc.nci.nih.gov</url>
         </bibl>
         <bibl id="B43">
            <title>
               <p>The Ensembl Database</p>
            </title>
            <url>http://www.ensembl.org</url>
         </bibl>
         <bibl id="B44">
            <title>
               <p>The significance of digital gene expression profiles</p>
            </title>
            <aug>
               <au>
                  <snm>Audic</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Claverie</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>Genome research</source>
            <pubdate>1997</pubdate>
            <volume>7</volume>
            <issue>10</issue>
            <fpage>986</fpage>
            <lpage>995</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9331369</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B45">
            <title>
               <p>National Institutes of Health moves ahead with "PubMed Central"</p>
            </title>
            <aug>
               <au>
                  <snm>Greenberg</snm>
                  <fnm>DS</fnm>
               </au>
            </aug>
            <source>Lancet</source>
            <pubdate>1999</pubdate>
            <volume>354</volume>
            <issue>9183</issue>
            <fpage>1009</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0140-6736(05)76619-8</pubid>
                  <pubid idtype="pmpid">10501376</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B46">
            <title>
               <p>Improved Medical Sentence Parser</p>
            </title>
            <aug>
               <au>
                  <snm>Berman</snm>
                  <fnm>JJ</fnm>
               </au>
            </aug>
            <source>Arch Pathol Lab Med</source>
            <pubdate>2003</pubdate>
            <volume>127</volume>
            <fpage>789</fpage>
            <lpage>813</lpage>
         </bibl>
         <bibl id="B47">
            <title>
               <p>BiNGO: a Cytoscape plugin to assess overrepresentation of gene ontology categories in biological networks</p>
            </title>
            <aug>
               <au>
                  <snm>Maere</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Heymans</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Kuiper</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Bioinformatics (Oxford, England)</source>
            <pubdate>2005</pubdate>
            <volume>21</volume>
            <issue>16</issue>
            <fpage>3448</fpage>
            <lpage>3449</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/bti551</pubid>
                  <pubid idtype="pmpid" link="fulltext">15972284</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B48">
            <title>
               <p>Cytoscape: a software environment for integrated models of biomolecular interaction networks</p>
            </title>
            <aug>
               <au>
                  <snm>Shannon</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Markiel</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Ozier</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Baliga</snm>
                  <fnm>NS</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>JT</fnm>
               </au>
               <au>
                  <snm>Ramage</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Amin</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Schwikowski</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Ideker</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Genome research</source>
            <pubdate>2003</pubdate>
            <volume>13</volume>
            <issue>11</issue>
            <fpage>2498</fpage>
            <lpage>2504</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">403769</pubid>
                  <pubid idtype="pmpid" link="fulltext">14597658</pubid>
                  <pubid idtype="doi">10.1101/gr.1239303</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B49">
            <title>
               <p>Controlling the False Discovery Rate: A Practical and Powerful Approach to Multiple Testing</p>
            </title>
            <aug>
               <au>
                  <snm>Benjamini</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Hochberg</snm>
                  <fnm>Y</fnm>
               </au>
            </aug>
            <source>Journal of the Royal Statistical Society, Series B</source>
            <pubdate>1995</pubdate>
            <volume>57</volume>
            <fpage>289</fpage>
            <lpage>300</lpage>
         </bibl>
      </refgrp>
   </bm>
</art>
