<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>gb-2007-8-5-r76</ui>
   <ji>GBJ</ji>
   <fm>
      <dochead>Research</dochead>
      <bibl>
         <title>
            <p>Identification of conserved gene expression features between murine mammary carcinoma models and human breast tumors</p>
         </title>
         <aug>
            <au id="A1" ce="yes">
               <snm>Herschkowitz</snm>
               <mi>I</mi>
               <fnm>Jason</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>jih@unc.edu</email>
            </au>
            <au id="A2" ce="yes">
               <snm>Simin</snm>
               <fnm>Karl</fnm>
               <insr iid="I3"/>
               <email>Karl.Simin@umassmed.edu</email>
            </au>
            <au id="A3">
               <snm>Weigman</snm>
               <mi>J</mi>
               <fnm>Victor</fnm>
               <insr iid="I4"/>
               <email>weigman@gmail.com</email>
            </au>
            <au id="A4">
               <snm>Mikaelian</snm>
               <fnm>Igor</fnm>
               <insr iid="I5"/>
               <email>igor.mikaelian@roche.com</email>
            </au>
            <au id="A5">
               <snm>Usary</snm>
               <fnm>Jerry</fnm>
               <insr iid="I1"/>
               <insr iid="I6"/>
               <email>usary@unc.edu</email>
            </au>
            <au id="A6">
               <snm>Hu</snm>
               <fnm>Zhiyuan</fnm>
               <insr iid="I1"/>
               <insr iid="I6"/>
               <email>zhu@med.unc.edu</email>
            </au>
            <au id="A7">
               <snm>Rasmussen</snm>
               <mi>E</mi>
               <fnm>Karen</fnm>
               <insr iid="I1"/>
               <insr iid="I6"/>
               <email>karen_rasmussen@med.unc.edu</email>
            </au>
            <au id="A8">
               <snm>Jones</snm>
               <mi>P</mi>
               <fnm>Laundette</fnm>
               <insr iid="I7"/>
               <email>ljone010@umaryland.edu</email>
            </au>
            <au id="A9">
               <snm>Assefnia</snm>
               <fnm>Shahin</fnm>
               <insr iid="I7"/>
               <email>sa358@georgetown.edu</email>
            </au>
            <au id="A10">
               <snm>Chandrasekharan</snm>
               <fnm>Subhashini</fnm>
               <insr iid="I6"/>
               <email>subhashini_chandrasekharan@med.unc.edu</email>
            </au>
            <au id="A11">
               <snm>Backlund</snm>
               <mi>G</mi>
               <fnm>Michael</fnm>
               <insr iid="I2"/>
               <email>michael.backlund@Vanderbilt.Edu</email>
            </au>
            <au id="A12">
               <snm>Yin</snm>
               <fnm>Yuzhi</fnm>
               <insr iid="I7"/>
               <email>yiny@georgetown.edu</email>
            </au>
            <au id="A13">
               <snm>Khramtsov</snm>
               <mi>I</mi>
               <fnm>Andrey</fnm>
               <insr iid="I8"/>
               <email>andrey1@uchicago.edu</email>
            </au>
            <au id="A14">
               <snm>Bastein</snm>
               <fnm>Roy</fnm>
               <insr iid="I9"/>
               <email>roy.bastien@hci.utah.edu</email>
            </au>
            <au id="A15">
               <snm>Quackenbush</snm>
               <fnm>John</fnm>
               <insr iid="I9"/>
               <email>john.quackenbush@hci.utah.edu</email>
            </au>
            <au id="A16">
               <snm>Glazer</snm>
               <mi>I</mi>
               <fnm>Robert</fnm>
               <insr iid="I7"/>
               <email>glazerr@georgetown.edu</email>
            </au>
            <au id="A17">
               <snm>Brown</snm>
               <mi>H</mi>
               <fnm>Powel</fnm>
               <insr iid="I10"/>
               <email>pbrown@breastcenter.tmc.edu</email>
            </au>
            <au id="A18">
               <snm>Green</snm>
               <mi>E</mi>
               <fnm>Jeffrey</fnm>
               <insr iid="I11"/>
               <email>jegreen@mail.nih.gov</email>
            </au>
            <au id="A19">
               <snm>Kopelovich</snm>
               <fnm>Levy</fnm>
               <insr iid="I12"/>
               <email>kopelovich@nih.gov</email>
            </au>
            <au id="A20">
               <snm>Furth</snm>
               <mi>A</mi>
               <fnm>Priscilla</fnm>
               <insr iid="I7"/>
               <email>paf3@georgetown.edu</email>
            </au>
            <au id="A21">
               <snm>Palazzo</snm>
               <mi>P</mi>
               <fnm>Juan</fnm>
               <insr iid="I13"/>
               <email>Juan.Palazzo@jefferson.edu</email>
            </au>
            <au id="A22">
               <snm>Olopade</snm>
               <mi>I</mi>
               <fnm>Olufunmilayo</fnm>
               <insr iid="I14"/>
               <email>folopade@medicine.bsd.uchicago.edu</email>
            </au>
            <au id="A23">
               <snm>Bernard</snm>
               <mi>S</mi>
               <fnm>Philip</fnm>
               <insr iid="I9"/>
               <email>phil.bernard@hci.utah.edu</email>
            </au>
            <au id="A24">
               <snm>Churchill</snm>
               <mi>A</mi>
               <fnm>Gary</fnm>
               <insr iid="I5"/>
               <email>gary.churchill@jax.org</email>
            </au>
            <au id="A25">
               <snm>Van Dyke</snm>
               <fnm>Terry</fnm>
               <insr iid="I1"/>
               <insr iid="I6"/>
               <email>tvdlab@med.unc.edu</email>
            </au>
            <au id="A26" ca="yes">
               <snm>Perou</snm>
               <mi>M</mi>
               <fnm>Charles</fnm>
               <insr iid="I1"/>
               <insr iid="I6"/>
               <insr iid="I15"/>
               <email>cperou@med.unc.edu</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Lineberger Comprehensive Cancer Center</p>
            </ins>
            <ins id="I2">
               <p>Curriculum in Genetics and Molecular Biology, University of North Carolina at Chapel Hill, Chapel Hill, NC 27599, USA</p>
            </ins>
            <ins id="I3">
               <p>Department of Cancer Biology, University of Massachusetts Medical School, Worcester, MA 01605, USA</p>
            </ins>
            <ins id="I4">
               <p>Department of Biology and Program in Bioinformatics and Computational Biology, University of North Carolina at Chapel Hill, Chapel Hill, NC 27599, USA</p>
            </ins>
            <ins id="I5">
               <p>The Jackson Laboratory, Bar Harbor, ME 04609, USA</p>
            </ins>
            <ins id="I6">
               <p>Department of Genetics, University of North Carolina at Chapel Hill, Chapel Hill, NC 27599, USA</p>
            </ins>
            <ins id="I7">
               <p>Department of Oncology, Lombardi Comprehensive Cancer Center, Georgetown University, Washington, DC 20057, USA</p>
            </ins>
            <ins id="I8">
               <p>Department of Pathology, University of Chicago, Chicago, IL 60637, USA</p>
            </ins>
            <ins id="I9">
               <p>Department of Pathology, University of Utah School of Medicine, Salt Lake City, UT 84132, USA</p>
            </ins>
            <ins id="I10">
               <p>Baylor College of Medicine, Houston, TX 77030, USA</p>
            </ins>
            <ins id="I11">
               <p>Transgenic Oncogenesis Group, Laboratory of Cancer Biology and Genetics</p>
            </ins>
            <ins id="I12">
               <p>Chemoprevention Agent Development Research Group, National Cancer Institute, Bethesda, MD 20892, USA</p>
            </ins>
            <ins id="I13">
               <p>Department of Pathology, Thomas Jefferson University, Philadelphia, PA 19107, USA</p>
            </ins>
            <ins id="I14">
               <p>Section of Hematology/Oncology, Department of Medicine, Committees on Genetics and Cancer Biology, University of Chicago, Chicago, IL 60637, USA</p>
            </ins>
            <ins id="I15">
               <p>Department of Pathology and Laboratory Medicine, University of North Carolina at Chapel Hill, Chapel Hill, NC 27599, USA</p>
            </ins>
         </insg>
         <source>Genome Biology</source>
         <issn>1465-6906</issn>
         <pubdate>2007</pubdate>
         <volume>8</volume>
         <issue>5</issue>
         <fpage>R76</fpage>
         <url>http://genomebiology.com/2007/8/5/R76</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">17493263</pubid>
               <pubid idtype="doi">10.1186/gb-2007-8-5-r76</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>29</day>
               <month>8</month>
               <year>2006</year>
            </date>
         </rec>
         <revrec>
            <date>
               <day>18</day>
               <month>1</month>
               <year>2007</year>
            </date>
         </revrec>
         <acc>
            <date>
               <day>10</day>
               <month>5</month>
               <year>2007</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>10</day>
               <month>05</month>
               <year>2007</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2007</year>
         <collab>Herschkowitz, et al., licensee BioMed Central Ltd.</collab>
         <note>This is an open access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <shorttitle>
         <p>Breast cancer-model expression</p>
      </shorttitle>
      <shortabs>
         <p>Comparison of mammary tumor gene-expression profiles from thirteen murine models using microarrays and with that of human breast tumors showed that many of the defining characteristics of human subtypes were conserved among mouse models.</p>
      </shortabs>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>Although numerous mouse models of breast carcinomas have been developed, we do not know the extent to which any faithfully represent clinically significant human phenotypes. To address this need, we characterized mammary tumor gene expression profiles from 13 different murine models using DNA microarrays and compared the resulting data to those from human breast tumors.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>Unsupervised hierarchical clustering analysis showed that six models (TgWAP-<it>Myc</it>, TgMMTV-<it>Neu</it>, TgMMTV-<it>PyMT</it>, TgWAP-<it>Int3</it>, TgWAP-<it>Tag</it>, and TgC3(1)-<it>Tag</it>) yielded tumors with distinctive and homogeneous expression patterns within each strain. However, in each of four other models (TgWAP-<it>T</it><sub><it>121</it></sub>, TgMMTV-<it>Wnt1</it>, <it>Brca1</it><sup><it>Co</it>/<it>Co</it></sup>;TgMMTV-<it>Cre</it>;<it>p53</it><sup>+/- </sup>and DMBA-induced), tumors with a variety of histologies and expression profiles developed. In many models, similarities to human breast tumors were recognized, including proliferation and human breast tumor subtype signatures. Significantly, tumors of several models displayed characteristics of human basal-like breast tumors, including two models with induced <it>Brca1 </it>deficiencies. Tumors of other murine models shared features and trended towards significance of gene enrichment with human luminal tumors; however, these murine tumors lacked expression of estrogen receptor (ER) and ER-regulated genes. TgMMTV-<it>Neu </it>tumors did not have a significant gene overlap with the human HER2+/ER- subtype and were more similar to human luminal tumors.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>Many of the defining characteristics of human subtypes were conserved among the mouse models. Although no single mouse model recapitulated all the expression features of a given human subtype, these shared expression features provide a common framework for an improved integration of murine mammary tumor models with human breast tumors.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <meta>
      <classifications>
         <classification type="BMC" subtype="man_spc_id" id="30010003">Cancer</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010010">Genome studies</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010015">Model organisms</classification>
      </classifications>
   </meta>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>Global gene expression analyses of human breast cancers have identified at least three major tumor subtypes and a normal breast tissue group <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. Two subtypes are estrogen receptor (ER)-negative with poor patient outcomes <abbrgrp><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr></abbrgrp>; one of these two subtypes is defined by the high expression of HER2/ERBB2/NEU (HER2+/ER-) and the other shows characteristics of basal/myoepithelial cells (basal-like). The third major subtype is ER-positive and Keratin 8/18-positive, and designated the 'luminal' subtype. This subtype has been subdivided into good outcome 'luminal A' tumors and poor outcome 'luminal B' tumors <abbrgrp><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr></abbrgrp>. These studies emphasize that human breast cancers are multiple distinct diseases, with each of the major subtypes likely harboring different genetic alterations and responding distinctly to therapy <abbrgrp><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr></abbrgrp>. Further similar investigations may well identify additional subtypes useful in diagnosis and treatment; however, such research would be accelerated if the relevant disease properties could be accurately modeled in experimental animals. Signatures associated with specific genetic lesions and biologies can be causally assigned in such models, potentially allowing for refinement of human data.</p>
         <p>Significant progress in the ability to genetically engineer mice has led to the generation of models that recapitulate many properties of human cancers <abbrgrp><abbr bid="B6">6</abbr></abbrgrp>. Mouse mammary tumor models have been designed to emulate genetic alterations found in human breast cancers, including inactivation of TP53, BRCA1, and RB, and overexpression of MYC and HER2/ERBB2/NEU. Such models have been generated through several strategies, including transgenic overexpression of oncogenes, expression of dominant interfering proteins, targeted disruption of tumor suppressor genes, and by treatment with chemical carcinogens <abbrgrp><abbr bid="B7">7</abbr></abbrgrp>. While there are many advantages to using the mouse as a surrogate, there are also potential caveats, including differences in mammary physiologies and the possibility of unknown species-specific pathway differences. Furthermore, it is not always clear which features of a human cancer are most relevant for disease comparisons (for example, genetic aberrations, histological features, tumor biology). Genomic profiling provides a tool for comparative cancer analysis and offers a powerful means of cross-species comparison. Recent studies applying microarray technology to human lung, liver, or prostate carcinomas and their respective murine counterparts have reported commonalities <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr></abbrgrp>. In general, each of these studies focused on a single or few mouse models. Here, we used gene expression analysis to classify a large set of mouse mammary tumor models and human breast tumors. The results provide biological insights among and across the mouse models, and comparisons with human data identify biologically and clinically significant shared features.</p>
      </sec>
      <sec>
         <st>
            <p>Results</p>
         </st>
         <sec>
            <st>
               <p>Murine tumor analysis</p>
            </st>
            <p>To characterize the diversity of biological phenotypes present within murine mammary carcinoma models, we performed microarray-based gene expression analyses on tumors from 13 different murine models (Table <tblr tid="T1">1</tblr>) using Agilent microarrays and a common reference design <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. We performed 122 microarrays consisting of 108 unique mammary tumors and 10 normal mammary gland samples (Additional data file 1). Using an unsupervised hierarchical cluster analysis of the data (Additional data file 2), murine tumor profiles indicated the presence of gene sets characteristic of endothelial cells, fibroblasts, adipocytes, lymphocytes, and two distinct epithelial cell types (basal/myoepithelial and luminal). Grouping of the murine tumors in this unsupervised cluster showed that some models developed tumors with consistent, model-specific patterns of expression, while other models showed greater diversity and did not necessarily group together. Specifically, the TgWAP-<it>Myc</it>, TgMMTV-<it>Neu</it>, TgMMTV-<it>PyMT</it>, TgWAP-<it>Int3 </it>(<it>Notch4</it>), TgWAP-<it>Tag </it>and TgC3(1)-<it>Tag </it>tumors had high within-model correlations. In contrast, tumors from the TgWAP-<it>T</it><sub><it>121</it></sub>, TgMMTV-<it>Wnt1</it>, <it>Brca1</it><sup><it>Co</it>/<it>Co</it></sup>;TgMMTV-Cre;<it>p53</it><sup>+/-</sup>, and DMBA-induced models showed diverse expression patterns. The <it>p53</it><sup>-/- </sup>transplant model tended to be homogenous, with 4/5 tumors grouping together, while the <it>Brca1</it><sup>+/-</sup>;<it>p53</it><sup>+/- </sup>ionizing radiation (IR) and <it>p53</it><sup>+/- </sup>IR models showed somewhat heterogeneous features between tumors; yet, 6/7 <it>Brca1</it><sup>+/-</sup>;<it>p53</it><sup>+/- </sup>IR and 5/7 <it>p53</it><sup>+/- </sup>IR were all present within a single dendrogram branch.</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Summary of mouse mammary tumor models</p>
               </caption>
               <tblbdy cols="6">
                  <r>
                     <c ca="left">
                        <p>Tumor model</p>
                     </c>
                     <c ca="center">
                        <p>No. of tumors</p>
                     </c>
                     <c ca="center">
                        <p>Specificity of lesions</p>
                     </c>
                     <c ca="left">
                        <p>Experimental oncogenic lesion(s)</p>
                     </c>
                     <c ca="center">
                        <p>Strain</p>
                     </c>
                     <c ca="center">
                        <p>Reference</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="6">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>TgWAP-<it>Myc</it></p>
                     </c>
                     <c ca="center">
                        <p>13</p>
                     </c>
                     <c ca="center">
                        <p>WAP*</p>
                     </c>
                     <c ca="left">
                        <p>cMyc overexpression</p>
                     </c>
                     <c ca="center">
                        <p>FVB</p>
                     </c>
                     <c ca="center">
                        <p>[60]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>TgWAP-<it>Int3</it></p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>WAP</p>
                     </c>
                     <c ca="left">
                        <p>Notch4 overexpression</p>
                     </c>
                     <c ca="center">
                        <p>FVB</p>
                     </c>
                     <c ca="center">
                        <p>[61]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>TgWAP-<it>T</it><sub><it>121</it></sub></p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>WAP</p>
                     </c>
                     <c ca="left">
                        <p>pRb, p107, p130 inactivation</p>
                     </c>
                     <c ca="center">
                        <p>B6D2</p>
                     </c>
                     <c ca="center">
                        <p>[37]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>TgWAP-<it>T</it><sub><it>121</it></sub></p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>WAP</p>
                     </c>
                     <c ca="left">
                        <p>pRb, p107, p130 inactivation</p>
                     </c>
                     <c ca="center">
                        <p>BALB/cJ</p>
                     </c>
                     <c ca="center">
                        <p>[37]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>TgWAP-<it>Tag</it></p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>WAP</p>
                     </c>
                     <c ca="left">
                        <p>SV40 L-T (pRb, p107, p130, p53, p300 inactivation, others); SV40 s-t</p>
                     </c>
                     <c ca="center">
                        <p>C57Bl/6</p>
                     </c>
                     <c ca="center">
                        <p>[62]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>TgC3(1)-<it>Tag</it></p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>C3(1)<sup>&#8224;</sup></p>
                     </c>
                     <c ca="left">
                        <p>SV40 L-T (pRb, p107, p130, p53, p300 inactivation, others); SV40 s-t</p>
                     </c>
                     <c ca="center">
                        <p>FVB</p>
                     </c>
                     <c ca="center">
                        <p>[63]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>TgMMTV-<it>Neu</it></p>
                     </c>
                     <c ca="center">
                        <p>10</p>
                     </c>
                     <c ca="center">
                        <p>MMTV<sup>&#8225;</sup></p>
                     </c>
                     <c ca="left">
                        <p>Unactivated rat Her2 overexpression</p>
                     </c>
                     <c ca="center">
                        <p>FVB</p>
                     </c>
                     <c ca="center">
                        <p>[64]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>TgMMTV-<it>Wnt1</it></p>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                     <c ca="center">
                        <p>MMTV</p>
                     </c>
                     <c ca="left">
                        <p>Wnt 1 overexpression</p>
                     </c>
                     <c ca="center">
                        <p>FVB</p>
                     </c>
                     <c ca="center">
                        <p>[65]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>TgMMTV-<it>PyMT</it></p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>MMTV</p>
                     </c>
                     <c ca="left">
                        <p>Py-MT (activation of Src, PI-3' kinase, and Shc)</p>
                     </c>
                     <c ca="center">
                        <p>FVB</p>
                     </c>
                     <c ca="center">
                        <p>[66]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>TgMMTV-<it>Cre</it>;<it>Brca1</it><sup><it>Co</it>/<it>Co</it></sup>;<it>p</it>53<sup>+/-</sup></p>
                     </c>
                     <c ca="center">
                        <p>10</p>
                     </c>
                     <c ca="center">
                        <p>MMTV</p>
                     </c>
                     <c ca="left">
                        <p>Brca1 truncation mutant; p53 heterozygous null</p>
                     </c>
                     <c ca="center">
                        <p>C57Bl/6</p>
                     </c>
                     <c ca="center">
                        <p>[67]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p><it>p</it>53<sup>-/-</sup>transplanted</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>None</p>
                     </c>
                     <c ca="left">
                        <p>p53 inactivation</p>
                     </c>
                     <c ca="center">
                        <p>BALB/cJ</p>
                     </c>
                     <c ca="center">
                        <p>[68]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Medroxyprogesterone-DMBA-induced</p>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                     <c ca="center">
                        <p>None</p>
                     </c>
                     <c ca="left">
                        <p>Random DMBA-induced</p>
                     </c>
                     <c ca="center">
                        <p>FVB</p>
                     </c>
                     <c ca="center">
                        <p>[69]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p><it>p</it>53<sup>+/-</sup>irradiated</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>None</p>
                     </c>
                     <c ca="left">
                        <p>p53 heterozygous null, random IR induced</p>
                     </c>
                     <c ca="center">
                        <p>BALB/cJ</p>
                     </c>
                     <c ca="center">
                        <p>[70]</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p><it>Brca1</it><sup>+/-</sup>;<it>p</it>53<sup>+/-</sup>irradiated</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>None</p>
                     </c>
                     <c ca="left">
                        <p>Brca1 and p53 heterozygous null, random IR induced</p>
                     </c>
                     <c ca="center">
                        <p>BALB/cJ</p>
                     </c>
                     <c ca="center">
                        <p>[1]</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>*WAP, <it>whey acidic protein </it>promoter, commonly restricted to lactating mammary gland luminal cells. <sup>&#8224;</sup>C3(1), 5' flanking region of the C3(1) component of the rat prostate steroid binding protein, expressed in mammary ductal cells. <sup>&#8225;</sup>MMTV, mouse mammary tumor virus promoter, often expressed in virgin mammary gland epithelium, induced with lactation; often expressed at ectopic sites (for example, lymphoid cells, salivary gland, others).</p>
               </tblfn>
            </tbl>
            <p>As with previous human tumor studies <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B3">3</abbr></abbrgrp>, we performed an 'intrinsic' analysis to select genes consistently representative of groups/classes of murine samples. In the human studies, expression variation for each gene was determined using biological replicates from the same patient, and the 'intrinsic genes' identified by the algorithm had relatively low variation within biological replicates and high variation across individuals. In contrast, in this mouse study we applied the algorithm to groups of murine samples defined by an empirically determined correlation threshold of > 0.65 using the dendrogram from Additional data file 2. This 'intrinsic' analysis yielded 866 genes that we then used in a hierarchical cluster analysis (Figure <figr fid="F1">1</figr> and Additional data file 3 for the complete cluster diagram). This analysis identified ten potential groups containing five or more samples each, including a normal mammary gland group (Group I) and nine tumor groups (designated Groups II-X).</p>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Mouse models intrinsic gene set cluster analysis</p>
               </caption>
               <text>
                  <p>Mouse models intrinsic gene set cluster analysis. <b>(a) </b>Overview of the complete 866 gene cluster diagram. <b>(b) </b>Experimental sample associated dendrogram colored to indicate ten groups. <b>(c) </b>Luminal epithelial gene expression pattern that is highly expressed in TgMMTV-<it>PyMT</it>, TgMMTV-<it>Neu</it>, and TgWAP-<it>myc </it>tumors. <b>(d) </b>Genes encoding components of the basal lamina. <b>(e) </b>A second basal epithelial cluster of genes, including <it>Keratin </it>5. <b>(f) </b>Genes expressed in fibroblast cells and implicated in epithelial to mesenchymal transition, including <it>snail homolog </it>1. <b>(g) </b>A second mesenchymal cluster that is expressed in normals. See Additional data file 2 for the complete cluster diagram with all gene names.</p>
               </text>
               <graphic file="gb-2007-8-5-r76-1"/>
            </fig>
            <p>In general, these ten groups were contained within four main categories that included (Figure <figr fid="F1">1b</figr>, left to right): the normal mammary gland samples (Group I) and tumors with mesenchymal characteristics (Group II); tumors with basal/myoepithelial features (Groups III-V); tumors with luminal characteristics (Groups VI-VIII); and tumors containing mixed characteristics (Groups IX and X). Group I contained all normal mammary gland samples, which showed a high level of similarity regardless of strain, and was characterized by the high expression of basal/myoepithelial (Figure <figr fid="F1">1e</figr>) and mesenchymal features, including <it>vimentin </it>(Figure <figr fid="F1">1g</figr>). Group II samples were derived from several models (2/10 <it>Brca1</it><sup><it>Co</it>/<it>Co</it></sup>;TgMMTV-Cre;<it>p53</it><sup>+/-</sup>, 3/11 DMBA-induced, 1/5 <it>p53</it><sup>-/- </sup>transplant, 1/7 <it>p53</it><sup>+/- </sup>IR, 1/10 TgMMTV-<it>Neu </it>and 1/7 TgWAP-<it>T</it><sub><it>121</it></sub>) and also showed high expression of mesenchymal features (Figure <figr fid="F1">1g</figr>) that were shared with the normal samples in addition to a second highly expressed mesenchymal-like cluster that contained <it>snail homolog 1 </it>(a gene implicated in epithelial-mesenchymal transition <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>), the latter of which was not expressed in the normal samples (Figure <figr fid="F1">1f</figr>). Two TgWAP-<it>Myc </it>tumors at the extreme left of the dendrogram, which showed a distinct spindloid histology, also expressed these mesenchymal-like gene features. Further evidence for a mesenchymal phenotype for Group II tumors came from Keratin 8/18 (K8/18) and smooth muscle actin (SMA) immunofluorescence (IF) analyses, which showed that most spindloid tumors were K8/18-negative and SMA-positive (Figure <figr fid="F2">2l</figr>).</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Immunofluorescence staining of mouse samples for basal/myoepithelial and luminal cytokeratins</p>
               </caption>
               <text>
                  <p>Immunofluorescence staining of mouse samples for basal/myoepithelial and luminal cytokeratins. <b>(a) </b>Wild-type (wt) mammary gland stained for Keratins 8/18 (red) and Keratin 5 (green) shows K8/18 expression in luminal epithelial cells and K5 expression in basal/myoepithelial cells. <b>(b-f) </b>Mouse models that show luminal-like gene expression patterns stained with K8/18 (red) and K5 (green). <b>(g-k) </b>Tumor samples that show basal-like, or mixed luminal and basal characteristics by gene expression, stained for K8/18 (red) and K5 (green). <b>(j) </b>A subset of <it>Brca1</it><sup><it>Co</it>/<it>Co</it></sup>;TgMMTV-Cre;<it>p</it>53<sup>+/-</sup>tumors showing nodules of K5/K8/18 double positive cells. <b>(l) </b>A splindloid tumor stained for K8/18 (red) and smooth muscle actin (green).</p>
               </text>
               <graphic file="gb-2007-8-5-r76-2"/>
            </fig>
            <p>The second large category contained Groups III-V, with Group III (4/11 DMBA-induced and 5/11 <it>Wnt1</it>), Group IV (7/7 Brca1<sup>+/-</sup>;<it>p53</it><sup>+/- </sup>IR, 4/10 <it>Brca1</it><sup><it>Co</it>/<it>Co</it></sup>;TgMMTV-Cre;<it>p53</it><sup>+/-</sup>, 4/6 <it>p53</it><sup>+/- </sup>IR and 3/11 <it>Wnt1</it>) and Group V (4/5 <it>p53</it><sup>-/- </sup>transplant and 1/6 <it>p53</it><sup>+/- </sup>IR), showing characteristics of basal/myoepithelial cells (Figure <figr fid="F1">1d, e</figr>). These features were encompassed within two expression patterns. One cluster included <it>Keratin 14</it>, <it>17 </it>and <it>LY6D </it>(Figure <figr fid="F1">1d</figr>); <it>Keratin 17 </it>is a known human basal-like tumor marker <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B12">12</abbr></abbrgrp>, while <it>LY6D </it>is a member of the Ly6 family of glycosylphosphatidylinositol (GPI)-anchored proteins that is highly expressed in head and neck squamous cell carcinomas <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>. This cluster also contained components of the basement membrane (for example, <it>Laminins</it>) and hemidesmosomes (for example, <it>Envoplakin </it>and <it>Desmoplakin</it>), which link the basement membrane to cytoplasmic keratin filaments. A second basal/myoepithelial cluster highly expressed in Group III and IV tumors and a subset of DMBA tumors with squamous morphology was characterized by high expression of <it>ID4</it>, <it>TRIM29</it>, and <it>Keratin 5 </it>(Figure <figr fid="F1">1e</figr>), the latter of which is another human basal-like tumor marker <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B12">12</abbr></abbrgrp>. This gene set is expressed in a smaller subset of models compared to the set described above (Figure <figr fid="F1">1d</figr>), and is lower or absent in most Group V tumors. As predicted by gene expression data, most of these tumors stained positive for <it>Keratin 5 </it>(K5) by IF (Figure <figr fid="F2">2g-k</figr>).</p>
            <p>The third category of tumors (Groups VI-VIII) contained many of the 'homogenous' models, all of which showed a potential 'luminal' cell phenotype: Group VI contained the majority of the TgMMTV-<it>Neu </it>(9/10) and TgMMTV-<it>PyMT </it>(6/7) tumors, while Groups VII and VIII contained most of the TgWAP-<it>Myc </it>tumors (11/13) and TgWAP-<it>Int3 </it>samples (6/7), respectively. A distinguishing feature of these tumors (in particular Group VI) was the high expression of <it>XBP1 </it>(Figure <figr fid="F1">1c</figr>), which is a human luminal tumor-defining gene <abbrgrp><abbr bid="B14">14</abbr><abbr bid="B15">15</abbr><abbr bid="B16">16</abbr><abbr bid="B17">17</abbr></abbrgrp>. These tumors also expressed tight junction structural component genes, including <it>Occludin</it>, <it>Tight Junction Protein 2 </it>and <it>3</it>, and the luminal cell K8/18 (Additional data file 2). IF for K8/18 and K5 confirmed that these tumors all exclusively expressed K8/18 (Figure <figr fid="F2">2b-f</figr>).</p>
            <p>Finally, Group IX (1/10 <it>Brca1</it><sup><it>Co</it>/<it>Co</it></sup>;TgMMTV-Cre;<it>p53</it><sup>+/-</sup>, 4/7 TgWAP-<it>T</it><sub><it>121 </it></sub>tumors and 5/5 TgWAP-<it>Tag </it>tumors) and Group X (8/8 TgC3(1)-<it>Tag</it>) tumors were present at the far right and showed 'mixed' characteristics; in particular, the Group IX tumors showed some expression of luminal (Figure <figr fid="F1">1c</figr>), basal (Figure <figr fid="F1">1d</figr>) and mesenchymal genes (Figure <figr fid="F1">1f</figr>), while Group X tumors expressed basal (Figure <figr fid="F1">1e,f</figr>) and mesenchymal genes (Figure <figr fid="F1">1f,g</figr>).</p>
            <p>IF analyses showed that, as in humans <abbrgrp><abbr bid="B12">12</abbr><abbr bid="B18">18</abbr></abbrgrp>, the murine basal-like models tended to express K5 while the murine luminal models expressed only K8/18. However, some of the murine basal-like models developed tumors that harbored nests of cells of both basal (K5+) and luminal (K8/18+) cell lineages. For example, in some TgMMTV-<it>Wnt1 </it><abbrgrp><abbr bid="B19">19</abbr></abbrgrp>, DMBA-induced (Figure <figr fid="F2">2g,i</figr>), and <it>Brca1</it>-deficient strain tumors, distinct regions of single positive K5 and K8/18 cells were observed within the same tumor. Intriguingly, in some <it>Brca1</it><sup><it>Co</it>/<it>Co</it></sup>;TgMMTV-Cre;<it>p53</it><sup>+/- </sup>samples, nodules of double-positive K5 and K8/18 cells were identified, suggestive of a potential transition state or precursor/stem cell population (Figure <figr fid="F2">2j</figr>), while in some TgMMTV-<it>Wnt1 </it>(Figure <figr fid="F2">2h</figr>) <abbrgrp><abbr bid="B19">19</abbr></abbrgrp> and <it>Brca1</it>-deficient tumors, large regions of epithelioid cells were present that had little to no detectable K5 or K8/18 staining (data not shown).</p>
            <p>The reproducibility of these groups was evaluated using 'consensus clustering' (CC) <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>. CC using the intrinsic gene list showed strong concordance with the results sown in Figure <figr fid="F1">1</figr> and supports the existence of most of the groups identified using hierarchical clustering analysis (Additional data file 4). However, our further division of some of the CC-defined groups appears justified based upon biological knowledge. For instance, hierarchical clustering separated the normal mammary gland samples (Group I) and the histologically distinct spindloid tumors (Group II), which were combined into a single group by CC. Groups VI (TgMMTV-<it>Neu </it>and <it>PyMT</it>) and VII (TgWAP-<it>Myc</it>) were likewise separated by hierarchical clustering, but CC placed them into a single category. CC was also performed using all genes that were expressed and varied in expression (taken from Additional data file 2), which showed far less concordance with the intrinsic list-based classifications, and which often separated tumors from individual models into different groups (Figure <figr fid="F3">3c</figr>, bottom most panel); for example, the TgMMTV-<it>Neu </it>tumors were separated into two or three different groups, whereas these were distinct and single groups when analyzed using the intrinsic list. This is likely due to the presence or absence of gene expression patterns coming from other cell types (that is, lymphocytes, fibroblasts, and so on) in the 'all genes' list, which causes tumors to be grouped based upon qualities not coming from the tumor cells <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>.</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Unsupervised cluster analysis of the combined gene expression data for 232 human breast tumor samples and 122 mouse mammary tumor samples</p>
               </caption>
               <text>
                  <p>Unsupervised cluster analysis of the combined gene expression data for 232 human breast tumor samples and 122 mouse mammary tumor samples. <b>(a) </b>A color-coded matrix below the dendrogram identifies each sample; the first two rows show clinical ER and HER2 status, respectively, with red = positive, green = negative, and gray = not tested; the third row includes all human samples colored by intrinsic subtype as determined from Additional data file 6; red = basal-like, blue = luminal, pink = HER2+/ER-, yellow = claudin-low and green = normal breast-like. The remaining rows correspond to murine models indicated at the right. <b>(b) </b>A gene cluster containing basal epithelial genes. <b>(c) </b>A luminal epithelial gene cluster that includes <it>XBP1 </it>and <it>GATA3</it>. <b>(d) </b>A second luminal cluster containing <it>Keratins </it>8 and 18. <b>(e) </b>Proliferation gene cluster. <b>(f) </b>Interferon-regulated genes. <b>(g) </b>Fibroblast/mesenchymal enriched gene cluster. <b>(h) </b>The <it>Kras2 </it>amplicon cluster. See Additional data file 5 for the complete cluster diagram.</p>
               </text>
               <graphic file="gb-2007-8-5-r76-3"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Mouse-human combined unsupervised analysis</p>
            </st>
            <p>The murine gene clusters were reminiscent of gene clusters identified previously in human breast tumor samples. To more directly evaluate these potential shared characteristics, we performed an integrated analysis of the mouse data presented here with an expanded version of our previously reported human breast tumor data. The human data were derived from 232 microarrays representing 184 primary breast tumors and 9 normal breast samples also assayed on Agilent microarrays and using a common reference strategy (combined human datasets of <abbrgrp><abbr bid="B21">21</abbr><abbr bid="B22">22</abbr><abbr bid="B23">23</abbr></abbrgrp> plus 58 new patients/arrays). To combine the human and mouse datasets, we first used the Mouse Genome Informatics database to identify well-annotated mouse and human orthologous genes. We then performed a distance weighted discrimination correction, which is a supervised analysis method that identifies systematic differences present between two datasets and makes a global correction to compensate for these global biases <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>. Finally, we created an unsupervised hierarchical cluster of the mouse and human combined data (Figure <figr fid="F3">3</figr> and Additional data file 5 for the complete cluster diagram).</p>
            <p>This analysis identified many shared features, including clusters that resemble the cell-lineage clusters described above. Specifically, human basal-like tumors and murine <it>Brca1</it><sup>+/-</sup>;<it>p53</it><sup>+/-</sup>;IR, <it>Brca1</it><sup><it>Co</it>/<it>Co</it></sup>;TgMMTV-Cre;<it>p53</it><sup>+/-</sup>, TgMMTV-<it>Wnt1</it>, and some DMBA-induced tumors were characterized by the high expression of <it>Laminin gamma 2</it>, <it>Keratins 5</it>, <it>6B</it>, <it>13</it>, <it>14</it>, <it>15</it>, <it>TRIM29</it>, <it>c-KIT </it>and <it>CRYAB </it>(Figure <figr fid="F3">3b</figr>), the last of which is a human basal-like tumor marker possibly involved in resistance to chemotherapy <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. As described above, the <it>Brca1</it><sup>+/-</sup>;<it>p53</it><sup>+/-</sup>;IR, some <it>Brca1</it><sup><it>Co</it>/<it>Co</it></sup>;TgMMTV-Cre;<it>p53</it><sup>+/</sup>, DMBA-induced, and TgMMTV-<it>Wnt1 </it>tumors stained positive for K5 by IF, and human basal-like tumors tend to stain positive using a K5/6 antibody <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B12">12</abbr><abbr bid="B18">18</abbr><abbr bid="B26">26</abbr></abbrgrp>, thus showing that basal-like tumors from both species share K5 protein expression as a distinguishing feature.</p>
            <p>The murine and human 'luminal tumor' shared profile was not as similar as the shared basal profile, but did include the high expression of <it>SPDEF</it>, <it>XBP1 </it>and <it>GATA3 </it>(Figure <figr fid="F3">3c</figr>), and both species' luminal tumors also stained positive for K8/18 (Figure <figr fid="F2">2</figr> and see <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>). For many genes in this luminal cluster, however, the relative level of expression differed between the two species. For example, some genes were consistently high across both species' tumors (for example, <it>XBP1</it>, <it>SPDEF </it>and <it>GATA3</it>), while others, including <it>TFF</it>, <it>SLC39A6</it>, and <it>FOXA1</it>, were high in human luminal tumors and showed lower expression in murine tumors. Of note is that the human luminal epithelial gene cluster always contains the <it>Estrogen</it>-<it>Receptor </it>(<it>ER</it>) and many estrogen-regulated genes, including <it>TFF1 </it>and <it>SLC39A6 </it><abbrgrp><abbr bid="B22">22</abbr></abbrgrp>; since most murine mammary tumors, including those profiled here, are ER-negative, the apparent lack of involvement of ER and most ER-regulated genes could explain the difference in expression for some of the human luminal epithelial genes that show discordant expression in mice.</p>
            <p>Several other prominent and noteworthy features were also identified across species, including a 'proliferation' signature that includes the well documented proliferation marker Ki-67 (Figure <figr fid="F3">3e</figr>) <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B27">27</abbr><abbr bid="B28">28</abbr></abbrgrp> and an interferon-regulated pattern (Figure <figr fid="F3">3f</figr>) <abbrgrp><abbr bid="B27">27</abbr></abbrgrp>. The proliferation signature was highest in human basal-like tumors and in the murine models with impaired pRb function (that is, Group IX and X tumors). Currently, the growth regulatory impact of interferon-signaling in human breast tumors is not understood, and murine models that share this expression feature (TgMMTV-<it>Neu</it>, TgWAP-Tag, <it>p53</it><sup>-/- </sup>transplants, and spindloid tumors) may provide a model for future studies of this pathway. A fibroblast profile (Figure <figr fid="F3">3g</figr>) that was highly expressed in murine samples with spindloid morphology and in the TgWAP-<it>Myc </it>'spindloid' tumors was also observed in many human luminal and basal-like tumors; however, on average, this profile was expressed at lower levels in the murine tumors, which is consistent with the relative epithelial to stromal cell proportions seen histologically.</p>
            <p>Through these analyses we also discovered a potential new human subtype (Figure <figr fid="F3">3</figr>, top line-yellow group, and Additional data file 6). This subtype, which was apparent in both the human only and mouse-human combined dataset, is referred to as the 'claudin-low' subtype and is characterized by the low expression of genes involved in tight junctions and cell-cell adhesion, including <it>Claudins 3</it>, <it>4</it>, <it>7</it>, <it>Occludin</it>, and <it>E-cadherin </it>(Figure <figr fid="F3">3d</figr>). These human tumors (<it>n </it>= 13) also showed low expression of luminal genes, inconsistent basal gene expression, and high expression of lymphocyte and endothelial cell markers. All but one tumor in this group was clinically ER-negative, and all were diagnosed as grade II or III infiltrating ductal carcinomas (Additional data file 7 for representative hematoxylin and eosin images); thus, these tumors do not appear to be lobular carcinomas as might be predicted by their low expression of <it>E-cadherin</it>. The uniqueness of this group was supported by shared mesenchymal expression features with the murine spindloid tumors (Figure <figr fid="F3">3g</figr>), which cluster near these human tumors and also lack expression of the <it>Claudin </it>gene cluster (Figure <figr fid="F3">3d</figr>). Further analyses will be required to determine the cellular origins of these human tumors.</p>
         </sec>
         <sec>
            <st>
               <p>A common region of amplification across species</p>
            </st>
            <p>The murine C3(1)-<it>Tag </it>tumors and a subset of human basal-like tumors showed high expression of a cluster of genes, including <it>Kras2</it>, <it>Ipo8</it>, <it>Ppfibp1</it>, <it>Surb</it>, and <it>Cmas</it>, that are all located in a syntenic region corresponding to human chromosome 12p12 and mouse chromosome 6 (Figure <figr fid="F3">3h</figr>). <it>Kras2 </it>amplification is associated with tumor progression in the C3(1)-<it>Tag </it>model <abbrgrp><abbr bid="B29">29</abbr></abbrgrp>, and haplo-insufficiency of <it>Kras2 </it>delays tumor progression <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>. High co-expression of <it>Kras2</it>-linked genes prompted us to test whether DNA copy number changes might also account for the high expression of <it>Kras2 </it>among a subset of the human tumors. Indeed, 9 of 16 human basal-like tumors tested by quantitative PCR had increased genomic DNA copy numbers at the <it>KRAS2 </it>locus; however, no mutations were detected in <it>KRAS2 </it>in any of these 16 basal-like tumors. In addition, van Beers <it>et al</it>. <abbrgrp><abbr bid="B31">31</abbr></abbrgrp> reported that this region of human chromosome 12 is amplified in 47% of <it>BRCA1</it>-associated tumors by comparative genomic hybridization analysis; <it>BRCA1</it>-associated tumors are known to exhibit a basal-like molecular profile <abbrgrp><abbr bid="B3">3</abbr><abbr bid="B32">32</abbr></abbrgrp>. In cultured human mammary epithelial cells, which show basal/myoepithelial characteristics <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B33">33</abbr></abbrgrp>, both high oncogenic H-ras and SV40 Large T-antigen expression are necessary for transformation <abbrgrp><abbr bid="B34">34</abbr></abbrgrp>. Taken together, these findings suggest that amplification of <it>KRAS2 </it>may either influence the cellular phenotype or define a susceptible target cell type for basal-like tumors.</p>
         </sec>
         <sec>
            <st>
               <p>Mouse-human shared intrinsic features</p>
            </st>
            <p>To simultaneously classify mouse and human tumors, we identified the gene set that was in common between a human breast tumor intrinsic list (1,300 genes described in Hu <it>et al</it>. <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>) and the mouse intrinsic list developed here (866 genes). The overlap of these two lists totaled 106 genes, which when used in a hierarchical clustering analysis (Figure <figr fid="F4">4</figr>) identifies four main groups: the leftmost group contains all the human basal-like, 'claudin-low', and 5/44 HER2+/ER- tumors, and the murine C3(1)-<it>Tag</it>, TgWAP-<it>Tag</it>, and spindloid tumors. The second group (left to right) contains the normal samples from both humans and mice, a small subset (6/44) of human HER2+/ER- and 10/92 luminal tumors, and a significant portion of the remaining murine basal-like models. By clinical criteria, nearly all human tumors in these two groups were clinically classified as ER-negative.</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Cluster analysis of mouse and human tumors using the subset of genes common to both species intrinsic lists (106 total genes)</p>
               </caption>
               <text>
                  <p>Cluster analysis of mouse and human tumors using the subset of genes common to both species intrinsic lists (106 total genes). <b>(a) </b>Experimental sample associated dendrogram color coded according to human tumor subtype and with a matrix below showing murine tumor origins. <b>(b) </b>The complete 106 gene cluster diagram. <b>(c) </b>Close-up of genes known to be important for human basal-like tumors. <b>(d) </b>Close-up of genes known to be important for human luminal tumors, including ER. <b>(e) </b>Expression pattern of HER2/ERBB2/NEU.</p>
               </text>
               <graphic file="gb-2007-8-5-r76-4"/>
            </fig>
            <p>The third group contains 33/44 human HER2+/ER- tumors and the murine TgMMTV-<it>Neu</it>, MMTV-PyMT and TgWAP-<it>Myc </it>samples. Although the human HER2+/ER- tumors are predominantly ER-negative, this comparative genomic analysis and their keratin expression profiles as assessed by immunohistochemistry, suggests that the HER2+/ER- human tumors are 'luminal' in origin as opposed to showing basal-like features <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>. The fourth and right-most group is composed of ER-positive human luminal tumors and, lastly, the mouse TgWAP-<it>Int3 </it>(<it>Notch4</it>) tumors were in a group by themselves. These data show that although many mouse and human tumors were located on a large dendrogram branch that contained most murine luminal models and human HER2+/ER- tumors, none of the murine models we tested showed a strong human 'luminal' phenotype that is characterized by the high expression of <it>ER</it>, <it>GATA3</it>, <it>XBP1 </it>and <it>FOXA1</it>. These analyses suggest that the murine luminal models like MMTV-<it>Neu </it>showed their own unique profile that was a relatively weak human luminal phenotype that is missing the ER-signature. Presented at the bottom of Figure <figr fid="F4">4</figr> are biologically important genes discussed here, genes previously shown to be human basal-like tumor markers (Figure <figr fid="F4">4c</figr>), human luminal tumor markers, including ER (Figure <figr fid="F4">4d</figr>), and HER2/ERBB2/NEU (Figure <figr fid="F4">4e</figr>).</p>
         </sec>
         <sec>
            <st>
               <p>A comparison of gene sets defining human tumors and murine models</p>
            </st>
            <p>We used a second analysis method called gene set enrichment analysis (GSEA) <abbrgrp><abbr bid="B35">35</abbr></abbrgrp> to search for shared relationships between human tumor subtypes and murine models. For this analysis, we first performed a two-class unpaired significance analysis of microarray (SAM) <abbrgrp><abbr bid="B36">36</abbr></abbrgrp> analysis for each of the ten murine groups defined in Figure <figr fid="F1">1</figr>, and obtained a list of highly expressed genes that defined each group. Next, we performed similar analyses using each human subtype versus all other human tumors. Lastly, the murine lists were compared to each human subtype list using GSEA, which utilizes both gene list overlap and gene rank (Table <tblr tid="T2">2</tblr>). We found that the murine Groups IX (<it>p </it>= 0.004) and X (<it>p </it>= 0.001), which comprised tumors from pRb-deficient/p53-deficient models, shared significant overlap with the human basal-like subtype and tended to be anti-correlated with human luminal tumors (<it>p </it>= 0.083 and 0.006, respectively). Group III murine tumors (TgMMTV-<it>Wnt1 </it>mostly) significantly overlapped human normal breast samples (<it>p </it>= 0.008), possibly due to the expression of both luminal and basal/myoepithelial gene clusters in both groups. Group IV (<it>Brca1-deficient </it>and <it>Wnt1</it>) showed a significant association (<it>p </it>= 0.058) with the human basal-like profile. The murine Group VI (TgMMTV-<it>Neu </it>and TgMMTV-<it>PyMT</it>) showed a near significant association (<it>p </it>= 0.078) with the human luminal profile and were anti-correlated with the human basal-like subtype (<it>p </it>= 0.04). Finally, the murine Group II spindloid tumors showed significant overlap with human 'claudin-low' tumors (<it>p </it>= 0.001), which further suggests that this may be a distinct and novel human tumor subtype.</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Gene set enrichment analysis of the ten murine groups versus five human subtypes</p>
               </caption>
               <tblbdy cols="12">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2" ca="center">
                        <p>Basal-like</p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>Luminal</p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>HER2+/ER-</p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>Normal</p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>Claudin-low</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>Mouse class</p>
                     </c>
                     <c ca="center">
                        <p>No. of genes</p>
                     </c>
                     <c ca="center">
                        <p><it>p </it>value</p>
                     </c>
                     <c ca="center">
                        <p><it>p </it>value</p>
                     </c>
                     <c ca="center">
                        <p><it>p </it>value</p>
                     </c>
                     <c ca="center">
                        <p><it>p </it>value</p>
                     </c>
                     <c ca="center">
                        <p><it>p </it>value</p>
                     </c>
                     <c ca="center">
                        <p><it>p </it>value</p>
                     </c>
                     <c ca="center">
                        <p><it>p </it>value</p>
                     </c>
                     <c ca="center">
                        <p><it>p </it>value</p>
                     </c>
                     <c ca="center">
                        <p><it>p </it>value</p>
                     </c>
                     <c ca="center">
                        <p><it>p </it>value</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="12">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Is class</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>I</p>
                     </c>
                     <c ca="center">
                        <p>1,882</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.4625</p>
                     </c>
                     <c ca="center">
                        <p>0.8755</p>
                     </c>
                     <c ca="center">
                        <p>0.5388</p>
                     </c>
                     <c ca="center">
                        <p>0.9137</p>
                     </c>
                     <c ca="center">
                        <p>0.1659</p>
                     </c>
                     <c ca="center">
                        <p>0.5628</p>
                     </c>
                     <c ca="center">
                        <p>0.0048</p>
                     </c>
                     <c ca="center">
                        <p>0.1028</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>II</p>
                     </c>
                     <c ca="center">
                        <p>912</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.5867</p>
                     </c>
                     <c ca="center">
                        <p>0.9609</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.0021</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>0.001</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>III</p>
                     </c>
                     <c ca="center">
                        <p>143</p>
                     </c>
                     <c ca="center">
                        <p>0.5289</p>
                     </c>
                     <c ca="center">
                        <p>0.9048</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.5285</p>
                     </c>
                     <c ca="center">
                        <p>0.9047</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>0.008</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>IV</p>
                     </c>
                     <c ca="center">
                        <p>1,019</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>0.0581</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>V</p>
                     </c>
                     <c ca="center">
                        <p>34</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.8492</p>
                     </c>
                     <c ca="center">
                        <p>0.998</p>
                     </c>
                     <c ca="center">
                        <p>0.9324</p>
                     </c>
                     <c ca="center">
                        <p>0.999</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.0427</p>
                     </c>
                     <c ca="center">
                        <p>0.09274</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>VI</p>
                     </c>
                     <c ca="center">
                        <p>820</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.0062</p>
                     </c>
                     <c ca="center">
                        <p>0.0783</p>
                     </c>
                     <c ca="center">
                        <p>0.3536</p>
                     </c>
                     <c ca="center">
                        <p>0.7864</p>
                     </c>
                     <c ca="center">
                        <p>0.8653</p>
                     </c>
                     <c ca="center">
                        <p>0.9769</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>VII</p>
                     </c>
                     <c ca="center">
                        <p>851</p>
                     </c>
                     <c ca="center">
                        <p>0.1258</p>
                     </c>
                     <c ca="center">
                        <p>0.3768</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.5616</p>
                     </c>
                     <c ca="center">
                        <p>0.9137</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>VIII</p>
                     </c>
                     <c ca="center">
                        <p>236</p>
                     </c>
                     <c ca="center">
                        <p>0.1449</p>
                     </c>
                     <c ca="center">
                        <p>0.6098</p>
                     </c>
                     <c ca="center">
                        <p>0.3483</p>
                     </c>
                     <c ca="center">
                        <p>0.8205</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.01878</p>
                     </c>
                     <c ca="center">
                        <p>0.2349</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>IX</p>
                     </c>
                     <c ca="center">
                        <p>462</p>
                     </c>
                     <c ca="center">
                        <p>0.0019</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>0.004</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.56</p>
                     </c>
                     <c ca="center">
                        <p>0.9509</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>X</p>
                     </c>
                     <c ca="center">
                        <p>338</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>0.001</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.9275</p>
                     </c>
                     <c ca="center">
                        <p>0.998</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Is not class</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>I</p>
                     </c>
                     <c ca="center">
                        <p>1,882</p>
                     </c>
                     <c ca="center">
                        <p>0.0128</p>
                     </c>
                     <c ca="center">
                        <p>0.1662</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>II</p>
                     </c>
                     <c ca="center">
                        <p>912</p>
                     </c>
                     <c ca="center">
                        <p>0.3996</p>
                     </c>
                     <c ca="center">
                        <p>0.8348</p>
                     </c>
                     <c ca="center">
                        <p>0.8601</p>
                     </c>
                     <c ca="center">
                        <p>0.999</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.3602</p>
                     </c>
                     <c ca="center">
                        <p>0.7655</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>III</p>
                     </c>
                     <c ca="center">
                        <p>143</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.3178</p>
                     </c>
                     <c ca="center">
                        <p>0.7259</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.7628</p>
                     </c>
                     <c ca="center">
                        <p>0.991</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>IV</p>
                     </c>
                     <c ca="center">
                        <p>1,019</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.1833</p>
                     </c>
                     <c ca="center">
                        <p>0.6516</p>
                     </c>
                     <c ca="center">
                        <p>0.398</p>
                     </c>
                     <c ca="center">
                        <p>0.8427</p>
                     </c>
                     <c ca="center">
                        <p>0.2241</p>
                     </c>
                     <c ca="center">
                        <p>0.7255</p>
                     </c>
                     <c ca="center">
                        <p>0.1453</p>
                     </c>
                     <c ca="center">
                        <p>0.6116</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>V</p>
                     </c>
                     <c ca="center">
                        <p>34</p>
                     </c>
                     <c ca="center">
                        <p>0.86</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.0656</p>
                     </c>
                     <c ca="center">
                        <p>0.1653</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>VI</p>
                     </c>
                     <c ca="center">
                        <p>820</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>0.04</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.1043</p>
                     </c>
                     <c ca="center">
                        <p>0.4444</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>VII</p>
                     </c>
                     <c ca="center">
                        <p>851</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.1733</p>
                     </c>
                     <c ca="center">
                        <p>0.5151</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.5403</p>
                     </c>
                     <c ca="center">
                        <p>0.9128</p>
                     </c>
                     <c ca="center">
                        <p>0.1628</p>
                     </c>
                     <c ca="center">
                        <p>0.5215</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>VIII</p>
                     </c>
                     <c ca="center">
                        <p>236</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.1131</p>
                     </c>
                     <c ca="center">
                        <p>0.5305</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.6427</p>
                     </c>
                     <c ca="center">
                        <p>0.961</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>IX</p>
                     </c>
                     <c ca="center">
                        <p>462</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.04305</p>
                     </c>
                     <c ca="center">
                        <p>0.0833</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.022</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>0.037</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.2612</p>
                     </c>
                     <c ca="center">
                        <p>0.5936</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>X</p>
                     </c>
                     <c ca="center">
                        <p>338</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.02236</p>
                     </c>
                     <c ca="center">
                        <p>0.0682</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>0.1313</p>
                     </c>
                     <c ca="center">
                        <p>0.3717</p>
                     </c>
                     <c ca="center">
                        <p>0.5437</p>
                     </c>
                     <c ca="center">
                        <p>0.9489</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>Statistically significant findings are highlighted in bold. NOM = nominal.</p>
               </tblfn>
            </tbl>
            <p>We also performed a two-class unpaired SAM analysis using each mouse model as a representative of a pathway perturbation using the transgenic 'event' as a means of defining groups. Models that yielded a significant gene list (false discovery rate (FDR) = 1%) were compared to each human subtype as described above (Additional data file 8). The models based upon SV40 T-antigen (all C3(1)-Tag and WAP-Tag tumors) shared significant overlap with the human basal-like tumors (<it>p </it>= 0.002) and were marginally anti-correlated with the human luminal class. The BRCA1 deficient models (all Brca1<sup>+/-</sup>;<it>p53</it><sup>+/- </sup>IR and <it>Brca1</it><sup><it>Co</it>/<it>Co</it></sup>;TgMMTV-Cre;<it>p53</it><sup>+/- </sup>tumors) were marginally significant with human basal-like tumors (<it>p </it>= 0.088). The TgMMTV-<it>Neu </it>tumors were nominally significant (before correction for multiple comparisons) with human luminal tumors (<it>p </it>= 0.006) and anti-correlated with human basal-like tumors (<it>p </it>= 0.027).</p>
            <p>The two most important human breast tumor biomarkers are ER and HER2; therefore, we also analyzed these data relative to these two markers. Of the 232 human tumors assayed here, 137 had ER and HER2 data assessed by immunohistochemistry and microarray data. As has been noted before <abbrgrp><abbr bid="B3">3</abbr><abbr bid="B18">18</abbr><abbr bid="B21">21</abbr></abbrgrp>, there is a very high correlation between tumor intrinsic subtype and ER and HER2 clinical status (<it>p </it>&lt; 0.0001): for example, 81% of ER+ tumors were of the luminal phenotype, 63% of HER2+ tumors were classified as HER2+/ER-, and 80% of ER- and HER2- tumors were of the basal-like subtype. Using GSEA, we compared the ten mouse classes as defined in Figure <figr fid="F1">1</figr> (Additional data file 9) and the mouse model-based gene lists (Additional data file 10) to the human data/gene lists that were obtained by performing supervised analyses based upon human ER and HER2 status (please note that analyses using HER2 status alone (that is, HER2+ versus HER2-), and ER+ and HER2+ versus others were not included as human classes because HER2 status alone yielded genes on only the HER2 amplicon, and the ER+ and HER2+ classification did not yield a significant gene list). We found that the murine Groups IX (<it>p </it>= 0.009) and X (<it>p </it>= 0.003) tumors shared significant overlap with ER- HER2- human tumors and were significantly anti-correlated with human ER+ tumors (<it>p </it>= 0.024 and 0.043, respectively). Group VI murine samples (TgMMTV-<it>Neu </it>and TgMMTV-<it>PyMT</it>) likewise showed the same trend of enrichment with ER+ human tumors and anti-correlation with the ER- HER2- class. Although not perfect, these GSEA results are consistent with our observations from Figures <figr fid="F1">1</figr> and <figr fid="F3">3</figr> and again demonstrate that the basal-like profile is robustly shared between humans and mice, while the luminal profile shows some shared and some distinct features across species.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Discussion</p>
         </st>
         <p>Gene expression profiling of murine tumors and their comparison to human tumors identified characteristics relevant to individual murine models, to murine models in general, and to cancers of both species. First was the discovery that some murine models developed highly similar tumors within models, while others showed heterogeneity in expression and histological phenotypes. For the homogenous models, the study of progression or response to therapy is simplified because confounding variation across individuals is low. An example of this consistency even extended to secondary events that occurred within the TgC3(1)-<it>Tag </it>model, where many tumors shared the amplification and high expression of <it>Kras2 </it>(Figure <figr fid="F3">3h</figr>) - a feature also evident in a subset of human basal-like tumors.</p>
         <p>In contrast to the 'homogenous' models are models such as TgWAP-<it>T</it><sub><it>121</it></sub>, DMBA-induced and <it>Brca1</it><sup><it>Co</it>/<it>Co</it></sup>;TgMMTV-Cre;<it>p53</it><sup>+/-</sup>, where individual tumors within a given model often showed different gene expression profiles and histologies. It is likely that these models fall into one of three scenarios that could explain their heterogeneity: the first, represented by the TgWAP-<it>T</it><sub><it>121 </it></sub>model <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>, is that the transgene is responsible only for initiating tumorigenesis, leaving progression events to evolve stochastically and with longer latency periods. Such a model would likely give rise to different tumor subtypes depending on the subsequent pathways that are disrupted during tumor progression. A second possibility is that the initiating event generates genomic instability such that multiple distinct pathways can be affected by the experimental causal event, which may be the mechanism in the <it>Brca1</it>-inactivation tumors. The third scenario is that the target cell of transformation is a multi-potent progenitor with the ability to undergo differentiation into multiple epithelial lineages, or even mesenchymal lineages (for example, DMBA-induced and <it>Brca1</it><sup><it>Co</it>/<it>Co</it></sup>;TgMMTV-Cre;<it>p53</it><sup>+/-</sup>); support for this hypothesis comes from Keratin IF analyses in which, even within a histologically homogenous tumor, two types of epithelial cells are present (Figures <figr fid="F2">2g-k</figr>). The presence of subsets of individual cells positive for markers of two epithelial cell types also supports this possibility (Figure <figr fid="F2">2j</figr>). Alternative hypotheses include the possibility that multiple cell types sustain transforming events, and also that extensive non-cell-autonomous tissue responses occur. Regardless of the paradigm of transformation for these heterogeneous models, the study of progression or therapeutic response will best be accomplished by first sub-setting by subtype, and then focusing on biological phenotypes.</p>
         <p>There are at least two major applications for genomic comparisons between human tumors and their potential murine counterparts. First, such studies should identify those models that contain individual and/or global characteristics of a particular class of human tumors. Examples of important global characteristics identified here include the classification of murine and human tumors into basal and luminal groups. It appears as if four murine models developed potential luminal-like tumors (TgMMTV-<it>Neu</it>, TgMMTV-<it>PyMT</it>, TgWAP-<it>Myc</it>, and TgWAP-<it>Int3</it>), which is not surprising since both MMTV and WAP are thought to direct expression in differentiated alveolar/luminal cells <abbrgrp><abbr bid="B38">38</abbr><abbr bid="B39">39</abbr></abbrgrp>; however, it should be noted that the luminal profile across species was not statistically significant, likely due to the lack of ER and ER-regulated genes in the murine luminal tumors. Several murine models did show expression features consistent with human basal-like tumors, including the TgC3(1)-<it>Tag</it>, TgWAP-<it>Tag </it>and <it>Brca1</it>-deficient models. The SV40 T-antigen used in the TgC3(1)-<it>Tag </it>and TgWAP-<it>Tag </it>models inactivates p53 and RB, which also appear to be two likely events that occur in human basal-like tumors because these tumors are known to harbor <it>p53 </it>mutations <abbrgrp><abbr bid="B2">2</abbr></abbrgrp>, have high mitotic grade and the highest expression of proliferation genes (Figure <figr fid="F3">3</figr>) <abbrgrp><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr></abbrgrp>, which are known E2F targets <abbrgrp><abbr bid="B40">40</abbr></abbrgrp>. The proliferation signature in human breast cancers is itself prognostic <abbrgrp><abbr bid="B41">41</abbr></abbrgrp>, and is also predictive of response to chemotherapy <abbrgrp><abbr bid="B42">42</abbr></abbrgrp>. These data suggest that human basal-like tumors might have impairment of RB function and highlight an important shared feature of murine and human mammary carcinomas.</p>
         <p>The finding that <it>Brca1 </it>loss (coincident with <it>p53 </it>mutation) in mice gives rise to tumors with a basal-like phenotype is notable because humans carrying <it>BRCA1 </it>germline mutations also develop basal-like tumors <abbrgrp><abbr bid="B3">3</abbr><abbr bid="B32">32</abbr></abbrgrp>, and most human <it>BRCA1 </it>mutant tumors are p53-deficient <abbrgrp><abbr bid="B43">43</abbr><abbr bid="B44">44</abbr></abbrgrp>. These data suggest a conserved predisposition of the basal-like cell type, or its progenitor cell, to transform as a result of <it>BRCA1</it>, <it>TP53</it>, and <it>RB</it>-pathway loss. Most DMBA-induced carcinomas also showed basal-like cell lineage features, suggesting that this cell type is also susceptible to DMBA-mediated tumorigenesis. Finally, some TgMMTV-<it>Wnt1 </it>tumors showed a combination of basal-like and luminal characteristics by gene expression, which is consistent with the observation that tumors of this model generally contain cells from both mammary epithelial lineages <abbrgrp><abbr bid="B45">45</abbr></abbrgrp>.</p>
         <p>The second major purpose of comparative studies is to determine the extent to which analyses of murine models can inform the human disease and guide further discovery. An example of murine models informing the human disease is encompassed by the analysis of the new potential human subtype discovered here (that is, claudin-low subtype). Further analysis will be necessary to confirm whether this is a <it>bona fide </it>subtype; however, the statistically significant gene overlap with a histologically distinct subset of murine tumors suggests it is a distinct biological entity. A second example of the murine tumors guiding discovery in humans was the common association of a K-Ras containing amplicon in a subset of human basal-like tumors and in the murine basal-like TgC3(1)-<it>Tag </it>strain tumors.</p>
         <p>An important caveat to all comparative studies is that there are clear biological differences between mice and humans, which may or may not directly impact disease mechanisms. A potential example of inherent species difference could be the aforementioned biology associated with ER and its downstream pathway. In humans, ER is highly expressed in luminal tumors <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>, with the luminal phenotype being characterized by the high expression of some genes that are ER-regulated like <it>PR </it>and <it>RERG </it><abbrgrp><abbr bid="B22">22</abbr></abbrgrp>, and other luminal genes that are likely GATA3-regulated, including <it>AGR2 </it>and <it>K8/18 </it><abbrgrp><abbr bid="B46">46</abbr></abbrgrp>. In mice, ER expression is low to absent in all the tumors we tested, as is the expression of most human ER-responsive genes. This finding is consistent with previous reports that most late-stage murine mammary tumors are ER-negative (<abbrgrp><abbr bid="B47">47</abbr></abbrgrp> and references within). However, it should be noted that two human luminal tumor-defining genes (<it>XBP1 </it>and <it>GATA3 </it><abbrgrp><abbr bid="B46">46</abbr></abbrgrp>, were both highly expressed in murine luminal tumors (Additional data file 2). Taken together, these data suggest that the human 'luminal' profile may actually be a combination of at least two profiles, one of which is ER-regulated and another of which is GATA3-regulated; support for a link between <it>GATA3 </it>and luminal cell origins comes from <it>GATA3 </it>loss studies in mice where the selective loss of <it>GATA3 </it>in the mammary gland resulted in either a lack of luminal cells, or a significant decrease in the number and/or maturation of luminal cells <abbrgrp><abbr bid="B48">48</abbr><abbr bid="B49">49</abbr></abbrgrp>. These results suggest that, in the mouse models tested here, the ER-regulated gene cassette that is present in human luminal tumors is missing, and that the GATA3-mediated luminal signature remains. Due to the partial luminal tumor signature in mice, we believe that the murine luminal models, including TgMMTV-<it>Neu </it>profiled here, best resemble human luminal tumors and more specifically possibly luminal B tumors, which are luminal tumors that express low amounts of ER and show a poor outcome <abbrgrp><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr><abbr bid="B21">21</abbr></abbrgrp>. While human HER2+/ER- subtype tumors and the murine TgMMTV-<it>Neu</it>, TgMMTV-<it>PyMT</it>, and TgWAP-<it>Myc </it>fall next to each other in the intrinsic-shared cluster (Figure <figr fid="F4">4</figr>), all of the other data argue against this association. A few murine ER-positive mammary tumor models have been developed <abbrgrp><abbr bid="B50">50</abbr><abbr bid="B51">51</abbr><abbr bid="B52">52</abbr><abbr bid="B53">53</abbr></abbrgrp>; however, none of these models were analyzed here.</p>
         <p>Of note, many expression patterns detected in this study were observed in only one species (Additional data file 5), and it is possible that some of these differences may arise from technical limitations rather than reflect important biological differences. Comparison between two expression datasets, especially when derived from different species, remains a technical challenge. Thus, we acknowledge the possibility that artifacts may have been introduced depending on the data analysis methodology. However, we are confident that the analyses described here identified many common and biologically relevant clusters, including a proliferation, basal epithelial, interferon-regulated and fibroblast signature, thus showing that the act of data combining across species did retain important features present within the individual datasets. There are many murine models of breast cancer that we did not look at in this study and many more will be developed. Like the 13 models we discussed here, we would expect that some of these models will have overlapping gene expression patterns with human subtypes while others will not. We believe that additional studies with larger numbers of samples, including more diversity from each species, is warranted. These analyses do confirm the notion that there is not a single murine model that perfectly represents a human breast cancer subtype; however, the murine models do show shared features with specific human subtypes and it is these commonalties that will lay the groundwork for many future studies.</p>
      </sec>
      <sec>
         <st>
            <p>Materials and methods</p>
         </st>
         <sec>
            <st>
               <p>Murine and human tumors</p>
            </st>
            <p>The murine tumor samples were obtained from multiple participating investigators, who all maintained the mice and harvested the murine tumors in the 0.5-1 cm stage following internationally recognized guidelines. The details concerning strain background, promoter, transgene, and specific alleles, and so on, are provided in Additional data file 1. All human tumor samples were collected from fresh frozen primary breast tumors using Institutional Review Board (IRB)-approved protocols and were profiled as described in <abbrgrp><abbr bid="B21">21</abbr><abbr bid="B22">22</abbr><abbr bid="B23">23</abbr></abbrgrp>. The clinical and pathological information for these human samples can be obtained at the University of North Carolina Microarray Database (UMD) <abbrgrp><abbr bid="B54">54</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Microarray experiments</p>
            </st>
            <p>Total RNA was collected from murine tumors, and wild-type mammary samples of both FVB and BALB/c inbred strains. RNA was purified using the RNeasy Mini Kit (Qiagen Inc., Valencia, CA, USA) according to the manufacturer's protocol using 20-30 mg tissue. RNA integrity was assessed using the RNA 6000 Nano LabChip kit followed by analysis using a Bioanalyzer (Agilent Technologies Inc., Santa Clara, CA, USA). Total RNA (2.5 &#956;g) was reverse transcribed, amplified and labeled with Cy5 using a Low RNA Input Amplification kit (Agilent). The common reference RNA sample for these experiments consisted of total RNA harvested from equal numbers of C57Bl6/J and 129 male and female day 1 pups (a gift from Dr Cam Patterson, UNC). The reference RNA was reverse transcribed, amplified, and labeled with Cy3. The amplified sample and reference were co-hybridized overnight to Agilent Mouse Oligo Microarrays (G4121A). They were then washed and scanned on a GenePix 4000B scanner (Molecular Devices Corporation, Sunnyvale, CA, USA), analyzed using GenePix 4.1 software and uploaded into our database where a Lowess normalization is automatically performed.</p>
         </sec>
         <sec>
            <st>
               <p>Microarray data analysis</p>
            </st>
            <p>All primary microarray data are available from the UMD <abbrgrp><abbr bid="B54">54</abbr></abbrgrp>, and at the Gene Expression Omnibus under the series GSE3165 (mouse and new human data), GSE1992, GSE2740 and GSE2741 (previously published human data) <abbrgrp><abbr bid="B55">55</abbr></abbrgrp>. The genes for all analyses were filtered by requiring the Lowess normalized intensity values in both channels to be > 30. The log<sub>2 </sub>ratio of Cy5/Cy3 was then reported for each gene. In the final dataset, only genes that reported values in 70% or more of the samples were included. The genes were median centered and then hierarchical clustering was performed using Cluster v2.12 <abbrgrp><abbr bid="B56">56</abbr></abbrgrp>. For the murine unsupervised analysis, and human-mouse unsupervised cluster analyses, we filtered for genes that varied at least three-fold or more, in at least three or more samples. Average linkage clustering was performed on genes and arrays and cluster viewing and display was performed using JavaTreeview v1.0.8 <abbrgrp><abbr bid="B57">57</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Mouse Intrinsic gene set analysis</p>
            </st>
            <p>Intrinsic 'groups' of experimental samples were chosen based upon having a Pearson correlation value of 0.65 or greater from the unsupervised clustering analysis of the 122 murine samples. The analysis was performed using the Intrinsic Gene Identifier v1.0 by Max Diehn/Stanford University <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. Technical replicates were removed from the file and the members of every highly correlated node were given identical class numbers, giving every sample that fell outside the 0.65 correlation cut-off a class of their own. Using these criteria, 16 groups of samples were identified (see Additional data file 1 for these groups) and a list of 866 'intrinsic' genes was selected using the criteria of one standard deviation below the mean intrinsic gene value. A human intrinsic list of 1,300 genes was created using a subset of 146 of the 232 samples used here, and is described in Hu <it>et al</it>. <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Consensus clustering</p>
            </st>
            <p>CC <abbrgrp><abbr bid="B20">20</abbr></abbrgrp> was performed locally using Gene Pattern 1.3.1 (built Jan 6, 2005), which was downloaded from the Broad Institute distribution website <abbrgrp><abbr bid="B58">58</abbr></abbrgrp>. Analyses were performed on the mouse dataset with all genes, and just with intrinsic genes separately. Ranges for the number of K clusters (or the focused number of classes) were from 2 to 15 to evaluate a wide range of possible groups. Using a Euclidian distance measure with average linkage, we re-sampled 1,000 times with both column and row normalization.</p>
         </sec>
         <sec>
            <st>
               <p>Combining murine and human expression datasets</p>
            </st>
            <p>Orthologous genes were reported by Mouse Genome Informatics (MGI 3.1) of The Jackson Laboratory. For both the human and murine datasets, Locus Link IDs assigned to Agilent oligo probe ID numbers were used to assign to MGI ID numbers. In cases where a single gene was represented by multiple probes, the median value of the redundant probes was used. This led to a total of orthologous pairings of 14,680 Agilent probes. Prior to combining the two datasets, each was column standardized to N(0,1), row median centered, and probe identifiers were converted to MGI IDs. The intersection of mouse and human MGI identifiers from genes that passed filters (same as used above) in both datasets yielded 7,907 orthologous genes in the total combined dataset. This dataset was next corrected for systemic biases using distance weighted discrimination <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>. Finally, the combined dataset was used for an average linkage hierarchical clustering analysis.</p>
         </sec>
         <sec>
            <st>
               <p>Gene set enrichment analysis</p>
            </st>
            <p>We took the 232 human samples and classified them as basal-like, luminal, HER2+/ER-, claudin-low, and normal breast-like according to a clustering analysis of the human dataset only (Additional data file 6), using the new intrinsic/UNC human gene list developed in Hu <it>et al</it>. <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>. Second, the murine samples were also classified based upon their clustering pattern in Figure <figr fid="F1">1</figr> that used the mouse intrinsic gene list, and were assigned to Groups I-X. Two-class unpaired SAM analysis was performed for each murine class separately versus all other classes using an FDR of 1% <abbrgrp><abbr bid="B36">36</abbr></abbrgrp>, resulting in 10 class-specific gene lists. Using only the set of highly expressed genes that were associated with each analysis (and ignoring the genes whose low expression correlated with a given class), GSEA <abbrgrp><abbr bid="B35">35</abbr></abbrgrp> was performed in R (v. 2.0.1) using the GSEA R package <abbrgrp><abbr bid="B59">59</abbr></abbrgrp>. The ten murine gene sets were then compared to each human subtype-ranked gene set and significant enrichments reported. For statistical strength of these enrichments, GSEA uses family wise error rate (FWER) to correct for multiple testing and FDR to reduce false positive reporting. The parameters used for all GSEA were: nperm = 1,000, weighted.score.type = 1, nom.p.val.threshold = -1, fwer.p.val.threshold = -1, fdr.q.val.threshold = 0.25, topgs = 12, adjust.FDR.q.val = FALSE, gs.size.threshold.min = 25, gs.size.threshold.max = 2,000, reverse.sign = FALSE, preproc.type = 0, random.seed = 3,338, perm.type = 0, fraction = 1, replace = FALSE.</p>
         </sec>
         <sec>
            <st>
               <p>Immunofluorescence</p>
            </st>
            <p>Paraffin-embedded sections (5 &#956;m thick) were processed using standard immunostaining methods. The antibodies and their dilution were &#945;-cytokeratin 5 (K5, 1:8,000, PRB-160P, Covance, Berkeley, CA, USA), and &#945;-cytokeratins 8/18 (Ker8/18, 1:450, GP11, Progen Biotecknik, Heidelberg, Germany). Briefly, slides were deparaffinized and hydrated through a series of xylenes and graded ethanol steps. Heat-mediated epitope retrieval was performed in boiling citrate buffer (pH 6.0) for 15 minutes, then samples cooled to room temperature for 30 minutes. Secondary antibodies for immunofluorescence were conjugated with Alexa Fluor-488 or -594 fluorophores (1:200, Molecular Probes, Invitrogen, Carlsbad, CA, USA). IF samples were mounted with VectaShield Hardset with DAPI mounting media (Vector, Burlingame, CA, USA).</p>
         </sec>
         <sec>
            <st>
               <p>Human KRAS2 amplification assay</p>
            </st>
            <p>We performed real-time quantitative PCR and fluorescent melting curve analyses using genomic DNAs from 16 basal-like tumors, a normal breast tissue sample, 2 leukocyte DNA, and 3 luminal tumors. DNA was extracted using the DNAeasy kit (Qiagen) and amplification was performed on the LightCycler using the following temperature parameters: 95&#176;C, 8 minutes; 50 cycles of 57&#176;C, 6 s; 72&#176;C, 6 s; 95&#176;C, 2 s; followed by cooling to 60&#176;C and a 0.1&#176;C/s ramp to 97&#176;C. Each PCR reaction contained 7.5 ng template DNA in a 10 &#956;l reaction using the LightCycler Faststart DNA Master SYBR Green I kit (Roche Applied Science, Indianapolis, IN, USA). Relative DNA copy number for each gene was determined by importing an external efficiency curve and using a 'normal' breast sample for a within-run calibrator. For each sample, the copy number for KRAS2 was divided by the average copy number of ACTB and G1P3. Amplification in any tumor was called if the relative fold change was greater than three standard deviations above the average of five control samples (two normal leukocyte samples and three luminal tumors).</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Additional data files</p>
         </st>
         <p>The following additional data are available with the online version of this paper. Additional data file <supplr sid="S1">1</supplr> is a table listing mouse tumor and normal sample associated data, including source, transgene and promoter information. Additional data file <supplr sid="S2">2</supplr> is a complete unsupervised cluster diagram of all mouse tumors. Samples are colored according to mouse model from which they were derived, and the genes were selected using a variation filter of three-fold or more on three or more samples. Additional data file <supplr sid="S3">3</supplr> ia a complete mouse models cluster diagram using the 866 gene murine intrinsic gene list. Additional data file <supplr sid="S4">4</supplr> provides CC analyses applied to the mouse models. <b>(a) </b>CC matrices generated using the 866 gene mouse intrinsic list, by cluster numbers K = 2 through K = 15. <b>(b) </b>Empirical cumulative distribution (CDF) plot corresponding to the consensus matrices in the range K = 2 to 15. <b>(c) </b>CC directly compared to the hierarchical clustering-based results. The dendrogram from Figure <figr fid="F1">1</figr> (using the intrinsic gene set) is shown and immediately below is a colored matrix showing sample assignments based upon the various number of K clusters from the CC. By comparison, the analysis performed on the mouse dataset using all genes (bottom matrix) is presented. Additional data file <supplr sid="S5">5</supplr> is a complete unsupervised cluster diagram of the combined gene expression patterns of 232 human breast tumor samples and 122 mouse mammary tumor samples. This unsupervised cluster analysis is based upon the orthologous gene overlap between the human and mouse microarrays, and then we selected for the subset of genes that varied three-fold or more on three or more arrays. Additional data file <supplr sid="S6">6</supplr> shows a cluster analysis of the 232 human samples using the human intrinsic/UNC gene set from Hu <it>et al</it>. <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>. This analysis was used to determine a human samples subtype (basal-like, luminal, HER2+/ER-, and so on), which was then used in the various SAM and GSEA analyses. Samples are colored according to their subtype: red = basal-like, blue = luminal, pink = HER2+/ER-, yellow = claudin-low and green = normal breast-like. Additional data file <supplr sid="S7">7</supplr> shows a histological characterization of six different human 'claudin-low' tumors using hematoxylin and eosin sections. Additional data file <supplr sid="S8">8</supplr> shows GSEA of murine pathway models versus five human subtypes. Additional data file <supplr sid="S9">9</supplr> shows GSEA of ten murine classes versus clinical ER status and HER2 status in ER negative patients. Additional data file <supplr sid="S10">10</supplr> shows GSEA of murine pathway models versus clinical ER status and HER2 status in ER negative patients.</p>
         <suppl id="S1">
            <title>
               <p>Additional data file 1</p>
            </title>
            <caption>
               <p>Mouse tumor and normal sample associated data including source, transgene and promoter information</p>
            </caption>
            <text>
               <p>Mouse tumor and normal sample associated data including source, transgene and promoter information.</p>
            </text>
            <file name="gb-2007-8-5-r76-S1.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S2">
            <title>
               <p>Additional data file 2</p>
            </title>
            <caption>
               <p>Complete unsupervised cluster diagram of all mouse tumors</p>
            </caption>
            <text>
               <p>Samples are colored according to mouse model from which they were derived, and the genes were selected using a variation filter of three-fold or more on three or more samples.</p>
            </text>
            <file name="gb-2007-8-5-r76-S2.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S3">
            <title>
               <p>Additional data file 3</p>
            </title>
            <caption>
               <p>Complete mouse models cluster diagram using the 866 gene murine intrinsic gene list</p>
            </caption>
            <text>
               <p>Complete mouse models cluster diagram using the 866 gene murine intrinsic gene list.</p>
            </text>
            <file name="gb-2007-8-5-r76-S3.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S4">
            <title>
               <p>Additional data file 4</p>
            </title>
            <caption>
               <p>CC analyses applied to the mouse models</p>
            </caption>
            <text>
               <p><b>(a) </b>CC matrices generated using the 866 gene mouse intrinsic list, by cluster numbers K = 2 through K = 15. <b>(b) </b>Empirical cumulative distribution (CDF) plot corresponding to the consensus matrices in the range K = 2 to 15. <b>(c) </b>CC directly compared to the hierarchical clustering-based results. The dendrogram from Figure <figr fid="F1">1</figr> (using the intrinsic gene set) is shown and immediately below is a colored matrix showing sample assignments based upon the various number of K clusters from the CC. By comparison, the analysis performed on the mouse dataset using all genes (bottom matrix) is presented.</p>
            </text>
            <file name="gb-2007-8-5-r76-S4.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S5">
            <title>
               <p>Additional data file 5</p>
            </title>
            <caption>
               <p>Complete unsupervised cluster diagram of the combined gene expression patterns of 232 human breast tumor samples and 122 mouse mammary tumor samples</p>
            </caption>
            <text>
               <p>This unsupervised cluster analysis is based upon the orthologous gene overlap between the human and mouse microarrays, and then we selected for the subset of genes that varied three-fold or more on three or more arrays.</p>
            </text>
            <file name="gb-2007-8-5-r76-S5.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S6">
            <title>
               <p>Additional data file 6</p>
            </title>
            <caption>
               <p>Cluster analysis of the 232 human samples using the human intrinsic/UNC gene set from <abbrgrp><abbr bid="B21">21</abbr></abbrgrp></p>
            </caption>
            <text>
               <p>This analysis was used to determine a human samples subtype (basal-like, luminal, HER2+/ER-, and so on), which was then used the various SAM and GSEA analyses. Samples are colored according to their subtype: red = basal-like, blue = luminal, pink = HER2+/ER-, yellow = claudin-low and green = normal breast-like.</p>
            </text>
            <file name="gb-2007-8-5-r76-S6.pdf">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S7">
            <title>
               <p>Additional data file 7</p>
            </title>
            <caption>
               <p>Histological characterization of six different human 'claudin-low' tumors using hematoxylin and eosin sections</p>
            </caption>
            <text>
               <p>Histological characterization of six different human 'claudin-low' tumors using hematoxylin and eosin sections.</p>
            </text>
            <file name="gb-2007-8-5-r76-S7.tiff">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S8">
            <title>
               <p>Additional data file 8</p>
            </title>
            <caption>
               <p>GSEA of murine pathway models versus five human subtypes</p>
            </caption>
            <text>
               <p>GSEA of murine pathway models versus five human subtypes.</p>
            </text>
            <file name="gb-2007-8-5-r76-S8.doc">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S9">
            <title>
               <p>Additional data file 9</p>
            </title>
            <caption>
               <p>GSEA of ten murine classes versus clinical ER status and HER2 status in ER negative patients</p>
            </caption>
            <text>
               <p>GSEA of ten murine classes versus clinical ER status and HER2 status in ER negative patients.</p>
            </text>
            <file name="gb-2007-8-5-r76-S9.doc">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S10">
            <title>
               <p>Additional data file 10</p>
            </title>
            <caption>
               <p>GSEA of murine pathway models versus clinical ER status and HER2 status in ER negative patients</p>
            </caption>
            <text>
               <p>GSEA of murine pathway models versus clinical ER status and HER2 status in ER negative patients.</p>
            </text>
            <file name="gb-2007-8-5-r76-S10.doc">
               <p>Click here for file</p>
            </file>
         </suppl>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>CMP was supported by funds from the NCI Breast SPORE program to UNC-CH (P50-CA58223-09A1), by NCI (RO1-CA-101227-01), by the Breast Cancer Research Foundation and by HHSN-261200433008C (N01-CN43308). KS was supported by a grant from NIEHS (T32 ES07017) and TVD was supported by NCI (RO1-CA046283-16). RG was supported by NO1-CN15044, and PAF was supported by NO1-CN-05024/CN/NCI. This research was supported in part by a grant from the Susan G Komen Breast Cancer Foundation (LPJ and SA). PHB was supported by funds from RO1-CA101211. We thank Beverly H Koller and Daniel Medina for generously providing tumor samples, and Ronald Lubet for assistance in obtaining murine tumor samples.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Molecular portraits of human breast tumours.</p>
            </title>
            <aug>
               <au>
                  <snm>Perou</snm>
                  <fnm>CM</fnm>
               </au>
               <au>
                  <snm>S&#248;rlie</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Eisen</snm>
                  <fnm>MB</fnm>
               </au>
               <au>
                  <snm>van de Rijn</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Jeffrey</snm>
                  <fnm>SS</fnm>
               </au>
               <au>
                  <snm>Rees</snm>
                  <fnm>CA</fnm>
               </au>
               <au>
                  <snm>Pollack</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Ross</snm>
                  <fnm>DT</fnm>
               </au>
               <au>
                  <snm>Johnsen</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Akslen</snm>
                  <fnm>LA</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nature</source>
            <pubdate>2000</pubdate>
            <volume>406</volume>
            <fpage>747</fpage>
            <lpage>752</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/35021093</pubid>
                  <pubid idtype="pmpid" link="fulltext">10963602</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>Gene expression patterns of breast carcinomas distinguish tumor subclasses with clinical implications.</p>
            </title>
            <aug>
               <au>
                  <snm>Sorlie</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Perou</snm>
                  <fnm>CM</fnm>
               </au>
               <au>
                  <snm>Tibshirani</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Aas</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Geisler</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Johnsen</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Hastie</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Eisen</snm>
                  <fnm>MB</fnm>
               </au>
               <au>
                  <snm>van de Rijn</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Jeffrey</snm>
                  <fnm>SS</fnm>
               </au>
               <etal/>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2001</pubdate>
            <volume>98</volume>
            <fpage>10869</fpage>
            <lpage>10874</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">58566</pubid>
                  <pubid idtype="pmpid" link="fulltext">11553815</pubid>
                  <pubid idtype="doi">10.1073/pnas.191367098</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Repeated observation of breast tumor subtypes in independent gene expression datasets.</p>
            </title>
            <aug>
               <au>
                  <snm>Sorlie</snm>
                  <fnm>T</fnm>
               </au>
               <au>
          