<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>gb-2008-9-6-r93</ui>
   <ji>GBJ</ji>
   <fm>
      <dochead>Method</dochead>
      <bibl>
         <title>
            <p>A mouse plasma peptide atlas as a resource for disease proteomics</p>
         </title>
         <aug>
            <au id="A1" ca="yes">
               <snm>Zhang</snm>
               <fnm>Qing</fnm>
               <insr iid="I1"/>
               <email>qing@fhcrc.org</email>
            </au>
            <au id="A2">
               <snm>Menon</snm>
               <fnm>Rajasree</fnm>
               <insr iid="I2"/>
               <email>rajmenon@umich.edu</email>
            </au>
            <au id="A3">
               <snm>Deutsch</snm>
               <mi>W</mi>
               <fnm>Eric</fnm>
               <insr iid="I3"/>
               <email>edeutsch@systemsbiology.org</email>
            </au>
            <au id="A4">
               <snm>Pitteri</snm>
               <mi>J</mi>
               <fnm>Sharon</fnm>
               <insr iid="I1"/>
               <email>spitteri@fhcrc.org</email>
            </au>
            <au id="A5">
               <snm>Faca</snm>
               <mi>M</mi>
               <fnm>Vitor</fnm>
               <insr iid="I1"/>
               <email>vfaca@fhcrc.org</email>
            </au>
            <au id="A6">
               <snm>Wang</snm>
               <fnm>Hong</fnm>
               <insr iid="I1"/>
               <email>hongwang@fhcrc.org</email>
            </au>
            <au id="A7">
               <snm>Newcomb</snm>
               <mi>F</mi>
               <fnm>Lisa</fnm>
               <insr iid="I1"/>
               <email>lnewcomb@fhcrc.org</email>
            </au>
            <au id="A8">
               <snm>DePinho</snm>
               <mi>A</mi>
               <fnm>Ronald</fnm>
               <insr iid="I4"/>
               <insr iid="I5"/>
               <email>ron_depinho@dfci.harvard.edu</email>
            </au>
            <au id="A9">
               <snm>Bardeesy</snm>
               <fnm>Nabeel</fnm>
               <insr iid="I6"/>
               <email>nelbardeesy@partners.org</email>
            </au>
            <au id="A10">
               <snm>Dinulescu</snm>
               <fnm>Daniela</fnm>
               <insr iid="I7"/>
               <email>ddinulescu@rics.bwh.harvard.edu</email>
            </au>
            <au id="A11">
               <snm>Hung</snm>
               <mi>E</mi>
               <fnm>Kenneth</fnm>
               <insr iid="I6"/>
               <email>khung@partners.org</email>
            </au>
            <au id="A12">
               <snm>Kucherlapati</snm>
               <fnm>Raju</fnm>
               <insr iid="I6"/>
               <email>rkucherlapati@partners.org</email>
            </au>
            <au id="A13">
               <snm>Jacks</snm>
               <fnm>Tyler</fnm>
               <insr iid="I8"/>
               <email>tjacks@mit.edu</email>
            </au>
            <au id="A14">
               <snm>Politi</snm>
               <fnm>Katerina</fnm>
               <insr iid="I9"/>
               <email>politik@mskcc.org</email>
            </au>
            <au id="A15">
               <snm>Aebersold</snm>
               <fnm>Ruedi</fnm>
               <insr iid="I3"/>
               <insr iid="I10"/>
               <email>raebersold@systemsbiology.org</email>
            </au>
            <au id="A16">
               <snm>Omenn</snm>
               <mi>S</mi>
               <fnm>Gilbert</fnm>
               <insr iid="I2"/>
               <email>gomenn@umich.edu</email>
            </au>
            <au id="A17">
               <snm>States</snm>
               <mi>J</mi>
               <fnm>David</fnm>
               <insr iid="I2"/>
               <email>dstates@umich.edu</email>
            </au>
            <au id="A18">
               <snm>Hanash</snm>
               <mi>M</mi>
               <fnm>Samir</fnm>
               <insr iid="I1"/>
               <email>shanash@fhcrc.org</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Fred Hutchinson Cancer Research Center, Seattle, WA 98109, USA</p>
            </ins>
            <ins id="I2">
               <p>Center for Computational Medicine and Biology, University of Michigan, Ann Arbor, MI 48109, USA</p>
            </ins>
            <ins id="I3">
               <p>Institute for Systems Biology, Seattle, WA 98103, USA</p>
            </ins>
            <ins id="I4">
               <p>Dana-Farber Cancer Institute, Harvard Cancer Center, Boston, MA 02115, USA</p>
            </ins>
            <ins id="I5">
               <p>Center for Applied Cancer Science, Belfer Institute for Innovative Cancer Science, Department of Medical Oncology, Medicine, Genetics, Dana-Farber Cancer Institute, Harvard Medical School, Boston, MA 02114, USA</p>
            </ins>
            <ins id="I6">
               <p>Massachusetts General Hospital, Harvard Medical School, Boston, MA 02114, USA</p>
            </ins>
            <ins id="I7">
               <p>Brigham and Women's Hospital, Harvard Medical School, Boston, MA 02115, USA</p>
            </ins>
            <ins id="I8">
               <p>Center for Cancer Research, Massachusetts Institute of Technology, Cambridge, MA 02139, USA</p>
            </ins>
            <ins id="I9">
               <p>Memorial Sloan-Kettering Cancer Center, New York, NY 10021, USA</p>
            </ins>
            <ins id="I10">
               <p>Institute of Molecular Systems Biology, ETH Zurich and Faculty of Science, University of Zurich, 8093 Zurich, Switzerland</p>
            </ins>
         </insg>
         <source>Genome Biology</source>
         <issn>1465-6906</issn>
         <pubdate>2008</pubdate>
         <volume>9</volume>
         <issue>6</issue>
         <fpage>R93</fpage>
         <url>http://genomebiology.com/2008/9/6/R93</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">18522751</pubid>
               <pubid idtype="doi">10.1186/gb-2008-9-6-r93</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>30</day>
               <month>1</month>
               <year>2008</year>
            </date>
         </rec>
         <revrec>
            <date>
               <day>4</day>
               <month>4</month>
               <year>2008</year>
            </date>
         </revrec>
         <acc>
            <date>
               <day>3</day>
               <month>6</month>
               <year>2008</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>03</day>
               <month>06</month>
               <year>2008</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2008</year>
         <collab>Zhang et al.; licensee BioMed Central Ltd.</collab>
         <note>This is an open access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <shorttitle>
         <p>Mouse plasma peptide atlas</p>
      </shorttitle>
      <shortabs>
         <p>A publicly available repository for high-quality peptide and protein data, identified by LC-MS/MS analysis.</p>
      </shortabs>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <p>We present an in-depth analysis of mouse plasma leading to the development of a publicly available repository composed of 568 liquid chromatography-tandem mass spectrometry runs. A total of 13,779 distinct peptides have been identified with high confidence. The corresponding approximately 3,000 proteins are estimated to span a 7 logarithmic range of abundance in plasma. A major finding from this study is the identification of novel isoforms and transcript variants not previously predicted from genome analysis.</p>
         </sec>
      </abs>
   </fm>
   <meta>
      <classifications>
         <classification type="BMC" subtype="man_spc_id" id="30010010">Genome studies</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010013">Methods</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010015">Model organisms</classification>
      </classifications>
   </meta>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>In-depth analysis of the plasma proteome has the potential to yield biomarkers that allow early disease detection, and monitoring of disease progression, regression or recurrence. Mouse models have provided a physiological context in which to explore various aspects of disease pathogenesis and complement the use of cell line models and tissue sampling approaches. Genetically engineered mouse models have been increasingly relied upon to investigate specific molecular alterations associated with human disease. Recent transcriptional profiling and comparative genomic analyses of human and mouse cancers have revealed significant concordance in genomic alterations and expression profiles, thus justifying reliance on mouse models to identify molecular alterations and markers potentially relevant to human cancers and other diseases <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr></abbrgrp>.</p>
         <p>Genetically engineered mouse models allow investigations of proteomic changes at defined stages of disease development, and exhibit reduced heterogeneity, thus providing greater ease of standardization of blood and tissue sampling and preparation. However, there has been limited comprehensive analysis to date of the mouse plasma proteome. Studies of disease related plasma protein alterations in the mouse will benefit from a publicly available plasma proteome database that assembles high quality queryable data and that informs about the extent of protein variation encompassed within the mouse proteome.</p>
         <p>Previous studies of mouse proteomes include a large-scale study of mouse liver tissue that identified 3,244 proteins <abbrgrp><abbr bid="B6">6</abbr></abbrgrp>. A comparative proteomics study of tumor and normal mammary tissue from a conditional HER2/Neu-driven mouse model of breast cancer identified changes in tissue proteins leading to the identification of up-regulated fibulin-2 and osteopontin in mouse plasma <abbrgrp><abbr bid="B7">7</abbr></abbrgrp>. A study of the plasma proteome in a mouse intestinal tumor model identified a protein subset that distinguished tumor bearing mice from controls <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>.</p>
         <p>We have implemented a proteomic strategy that allows in-depth analysis of the plasma proteome. We have applied this to protein digests of fractionated mouse plasma reference specimens to determine protein and peptide constituents of mouse plasma and have built a related data repository. A large number of novel transcript variants for mouse plasma proteins have been identified. The data are publicly available at the PeptideAtlas site <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>, which can be viewed and searched. The raw data as well as the search results are also available for download from the 'Data Repository' page of the same site.</p>
      </sec>
      <sec>
         <st>
            <p>Results</p>
         </st>
         <sec>
            <st>
               <p>Identification of 13,779 distinct peptides in mouse plasma</p>
            </st>
            <p>Four mouse reference plasma pools were each subjected to extensive fractionation and separate liquid chromatography-tandem mass spectrometry (LC-MS/MS) analysis of digests from individual fractions. The combined four experiments yielded 800,507 spectra with a PeptideProphet <abbrgrp><abbr bid="B10">10</abbr></abbrgrp> probability (P) score of &#8805;0.9 from a total of 568 LC-MS/MS runs. The overall false discovery rate for spectrum assignment was calculated to be 1.2% based on PeptideProphet cutoffs. Of the 13,779 distinct peptides with P &#8805;0.9 encompassed in the analysis, 13,461 peptides were successfully mapped to the Ensembl Mouse <abbrgrp><abbr bid="B11">11</abbr></abbrgrp> release 43, which was built on the NCBI m36 mouse assembly. Of the set of 13,779 distinct peptides, 9,170 (67%) were identified with at least 2 spectra. Cys-containing, Trp-containing, and Lys-containing peptides represented 3,709 (27%), 2,067 (15%), and 8,392 (61%) of the total peptides, respectively (Table <tblr tid="T1">1</tblr>).</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Summary of peptides identified with a PeptideProphet P score &#8805;0.9</p>
               </caption>
               <tblbdy cols="3">
                  <r>
                     <c ca="left">
                        <p>Peptide</p>
                     </c>
                     <c ca="center">
                        <p>Counts</p>
                     </c>
                     <c ca="center">
                        <p>Percentage</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total assignment above threshold</p>
                     </c>
                     <c ca="center">
                        <p>800,507</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total correct assignment</p>
                     </c>
                     <c ca="center">
                        <p>791,069</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total incorrect assignment</p>
                     </c>
                     <c ca="center">
                        <p>9,438</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Spectrum assignment false discovery rate</p>
                     </c>
                     <c ca="center">
                        <p>0.012</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total distinct peptides</p>
                     </c>
                     <c ca="center">
                        <p>13,779</p>
                     </c>
                     <c ca="center">
                        <p>100.00</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Distinct peptides mapped to human genome</p>
                     </c>
                     <c ca="center">
                        <p>13,461</p>
                     </c>
                     <c ca="center">
                        <p>97.69</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Possible proteins implicated in mapping</p>
                     </c>
                     <c ca="center">
                        <p>10,674</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Simple reduced proteins</p>
                     </c>
                     <c ca="center">
                        <p>4,084</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Simple reduced genes</p>
                     </c>
                     <c ca="center">
                        <p>3,580</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Unambiguously mapped proteins</p>
                     </c>
                     <c ca="center">
                        <p>1,590</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total distinct peptides, presented in &#8805;2 samples</p>
                     </c>
                     <c ca="center">
                        <p>9,170</p>
                     </c>
                     <c ca="center">
                        <p>66.55</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total singleton distinct peptides</p>
                     </c>
                     <c ca="center">
                        <p>4,609</p>
                     </c>
                     <c ca="center">
                        <p>33.45</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cys-containing distinct peptides</p>
                     </c>
                     <c ca="center">
                        <p>3,709</p>
                     </c>
                     <c ca="center">
                        <p>26.92</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Trp-containing distinct peptides</p>
                     </c>
                     <c ca="center">
                        <p>2,067</p>
                     </c>
                     <c ca="center">
                        <p>15.00</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Lys-containing distinct peptides</p>
                     </c>
                     <c ca="center">
                        <p>8,392</p>
                     </c>
                     <c ca="center">
                        <p>60.90</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total distinct peptides from colon cancer versus normal</p>
                     </c>
                     <c ca="center">
                        <p>5,958</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total distinct peptides from breast cancer versus normal</p>
                     </c>
                     <c ca="center">
                        <p>8,874</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total distinct peptides from pancreatic cancer versus normal</p>
                     </c>
                     <c ca="center">
                        <p>7,753</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total distinct peptides from ovarian cancer versus normal</p>
                     </c>
                     <c ca="center">
                        <p>5,368</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total distinct peptides in all four reference sets</p>
                     </c>
                     <c ca="center">
                        <p>2,897</p>
                     </c>
                     <c ca="center">
                        <p>21.02</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total distinct peptides in three reference sets</p>
                     </c>
                     <c ca="center">
                        <p>1,534</p>
                     </c>
                     <c ca="center">
                        <p>11.13</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total distinct peptides in two reference sets</p>
                     </c>
                     <c ca="center">
                        <p>2,415</p>
                     </c>
                     <c ca="center">
                        <p>17.53</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <p>The mean peptide length for the 13,779 peptide set was 16, with a range of 6-49 amino acids. There was a bias in the distribution of peptide length, which favored relatively long peptides (Figure <figr fid="F1">1</figr>). A similar finding from human proteome studies was previously reported <abbrgrp><abbr bid="B12">12</abbr></abbrgrp>. The under-representation of short peptides may result from losses due to reduced sequence-specific fragment ions, or difficulty in distinguishing them from noise due to low m/z values. The mean molecular weight of this set was approximately 1,750 Da with a range of 640-4,100 Da. The majority of peptides identified were either neutral or acidic, with an average pI of approximately 6. There were 5958, 8874, 7753, and 5368 distinct peptides identified for the 4 reference sets (Table <tblr tid="T1">1</tblr>). The number of peptides identified may relate to variability in protein levels between reference sets, particularly for abundant proteins, which affects mass spectrometer peptide sampling and variability in protein recovery with sample processing.</p>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Characterization of distinct peptides identified from mouse plasma reference sets</p>
               </caption>
               <text>
                  <p>Characterization of distinct peptides identified from mouse plasma reference sets. The histogram of peptide length of unique sequences in mouse PeptideAtlas (blue) is overlaid on an <it>in silico </it>tryptic digest of the IPI mouse database (black).</p>
               </text>
               <graphic file="gb-2008-9-6-r93-1"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Identification of 2,982 proteins in mouse plasma using ProteinProphet</p>
            </st>
            <p>A combined search of data from all four reference sets was done using ProteinProphet <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>. This yielded 2,982 distinct International Protein Index (IPI) identifications corresponding to 2,631 known genes plus 281 hypothetical proteins with an error rate less than 5%. Among these, 2,131 (71%) proteins were identified with at least 3 unique peptides, 2,600 (87%) with at least 2 unique peptides, and 382 with only one unique peptide (singlets, 13%). Among these singlets, 140 (37%) were observed only once within the whole study, and thus are likely the major source of false identifications. Cytoplasmic proteins contributed the most, at approximately 29%; extracellular, nucleus, and plasma membrane proteins accounted for 17%, 17%, and 14%, respectively, based on ingenuity pathway analysis <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>. The limited contribution of secreted and surface membrane proteins to the overall total may be the result of release through non-secreted pathways and cell turnover. The tissue distribution and gene expression levels of this set of proteins was investigated based on the mouse SymAtlas (Novartis Research Foundation) <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. The tissue with the maximum expression for a given gene was assigned to that particular gene. Approximately 8% of identified proteins had the highest expression of their corresponding genes represented by liver (mRNA per gram tissue), which is considered a major source of abundant plasma proteins. The range of MS/MS events corresponding to high confidence protein identifications based on two peptides or more varied between approximately 50,000 and 2. We previously observed a significant correlation between the number of MS/MS events for a given protein and its plasma protein concentration (log(MS/MS events) = (0.623 &#215; log(Protein concentration)) + 0.0625) (unpublished data). We infer, therefore, that abundance of mouse plasma proteins identified in this study may span a logarithmic range of 7.</p>
         </sec>
         <sec>
            <st>
               <p>Occurrence of cleaved protein forms</p>
            </st>
            <p>Proteins undergo numerous post-translational modifications, notably cleavages in the case of proteins shed into the circulation. The mouse PeptideAtlas may be queried to determine the distribution of peptides identified for a given protein and the occurrence of cleaved forms in particular fractions. This is illustrated for the epidermal growth factor receptor (EGFR), which is a single-pass type I membrane protein <abbrgrp><abbr bid="B16">16</abbr></abbrgrp>, as an example of the depth of analysis achieved and of the capabilities of the mouse PeptideAtlas. Detection of over-expressed EGFR is of relevance to a number of disease processes <abbrgrp><abbr bid="B17">17</abbr></abbrgrp>. The trans-membrane region is located at amino acids 646-668, and the extracellular domain is between amino acids 25-645 (Figure <figr fid="F2">2</figr>). A total of over 4,000 MS2 events in mouse PeptideAtlas corresponding to EGFR matched 34 distinct peptides that spanned exclusively the extracellular domain of the protein, resulting from cleavage and release of this domain. The PeptideAtlas provides a graphic interface for protein fragmentation and can be used as a tool for comparisons between different species. Of interest, one peptide derived from mouse EGFR, PAp00148806 (IPLENLQIIR amino acids 99-108, lab 34), was also identified in the PeptideAtlas analysis of the Human Proteome Organization (HUPO) human plasma samples as the mouse and the human share the same sequence for this peptide <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>.</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Peptide identification and distribution of mouse EGFR</p>
               </caption>
               <text>
                  <p>Peptide identification and distribution of mouse EGFR. A total of 34 distinct peptides were identified from approximately 4,000 MS2 events. All peptides are from the extracellular domain.</p>
               </text>
               <graphic file="gb-2008-9-6-r93-2"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Observed splice isoforms</p>
            </st>
            <p>Approximately 3,000 distinct peptides were identified that spanned exon boundaries, of which 1,717 were observed at least twice. Among these, 180 peptides were observed in all 4 mouse plasma pools/experiments, and mapped to proteins with a unique genome location. The database represents a useful resource for validation of splice isoforms predicted in the Ensembl mouse genome. For example, PAp00024736, with a peptide sequence DQGSCGSCWAFGAVEAISDR, was mapped to a single protein cathepsin B precursor with a unique genome location on mouse chromosome 14. This peptide was observed a total of 39 times in multiple fractions and in all 4 experiments. The first nine amino acids (DQGSCGSCW) covered one exon from genome location 62089806 to 62089832, while the rest (AFGAVEAISDR) were located on another exon at genome location 62090517 to 62090549. Cathepsin B regulates the hydrolysis of proteins with broad specificity for peptide bonds <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>.</p>
            <p>A list of approximately 950 peptides that did not map to any annotated gene in the mouse genome was developed, with an overall 1.7% false discovery rate for peptide identification. These represent putative novel open reading frames. The majority (61%) had at least two observations. One example is PAp00438183, with a sequence of RPQMVEGDHGDEIFSVFGAPLLK, which was identified over 300 times and in all 4 experiments. The peptide was mapped to a single protein, IPI00138342, the liver carboxylesterase N precursor. Its sequence matched to the coding region of this protein on chromosome 8 with 91% identity.</p>
         </sec>
         <sec>
            <st>
               <p>Identification of novel alternative splice isoforms</p>
            </st>
            <p>Alternative splicing plays a major role in protein diversity without significantly increasing genome size. Aberrations in alternative splice variants are known to contribute to a number of diseases <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>. As highlighted recently in the Encode project <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>, the extent of transcript structural variation in mammalian genomes has been under-appreciated. To identify novel splice isoforms that are translated into protein products, we interrogated the intact protein analysis system (IPAS; see Materials and methods) data sets using a protein sequence collection containing the products of both known and hypothetical transcripts.</p>
            <p>A target database with over 10 million sequences was built upon the ECgene <abbrgrp><abbr bid="B21">21</abbr></abbrgrp> and Ensembl mouse <abbrgrp><abbr bid="B11">11</abbr></abbrgrp> databases as described in Materials and methods and in Fermin <it>et al</it>. <abbrgrp><abbr bid="B22">22</abbr></abbrgrp>. An extensive computational analysis for a reference set was done to identify novel forms. Using a X!Tandem expect value of &lt;1e-3 as a threshold, we identified a total of 12,461 proteins and 8,154 distinct peptides matching 147,051 spectra in the target database. Among these, 7,291 distinct peptides (90%) were in multi-peptide sets and 863 (10%) in single peptide identification sets. At this threshold, 81 distinct reversed sequence proteins (0.65%) and 53 reversed sequence peptides (0.65%) matched 69 distinct spectra.</p>
            <p>The splice isoforms derived from a gene share exons with each other. Further, specific peptides may occur in several members of a paralogous family of proteins. To obtain a measure of the number of independent protein identifications, it is necessary to integrate protein identifications into covering sets (see Materials and methods). To be included in the integrated protein list, peptide spectral matches need to be unique and not explained by another protein in the list. The integrated list for the set of protein identifications including novel splice isoform translation products contained a total of 1,324 distinct proteins. Multiple splice isoforms were identified for a number of proteins that have been suggested as potential disease biomarkers in previous studies: Cpn1 (carboxypeptidase N, polypeptide 1), Pzp (pregnancy zone protein), Fabp5 (fatty acid binding protein 5) and Mbl2 (mannose binding lectin) <abbrgrp><abbr bid="B23">23</abbr></abbrgrp>. In selecting proteins to be members of the covering sets, our algorithm gives preference to annotated protein sequences. Of the integrated 1,324 protein sets, 1058 (80%) were annotated gene products (that is, proteins in the Ensembl protein collection) and 199 (15%) were found only in the ECGene collection of novel transcripts. Note that in many cases, the set of identifications 'covered' by an annotated protein will also contain proteins derived from previously un-annotated transcripts.</p>
         </sec>
         <sec>
            <st>
               <p>Comparative analysis of mouse and human splice isoforms</p>
            </st>
            <p>We examined mouse splice variants identified as homologues of human counterparts. Similarities were uncovered with human peptides. A case in point is mouse splice variant M13C2563_1_s386_e8960_1_rf2_c1_n0, which was identified with 13 distinct peptides from 19 spectra through the genomic database search. Peptides LLEAQIATGGIIDPK, GFFDPNTEENLTYLQLK, and LNDSILQATEQR were identified by four, three and two spectra, respectively. However, when all 13 peptides were searched against the NCBI NR database using the blastp program, 12 peptides matched to a predicted mouse protein similar to desmoplakin protein. In contrast, all 13 peptides were found to be homologous to the human desmoplakin sequence. The alignment of peptide LLEAQIATGGIIDPK using the UCSC Blast program is shown in Figure <figr fid="F3">3</figr>. This peptide aligns to the coding sequence of human desmoplakin, but not to the annotated mouse desmoplakin gene. Therefore, our data clarify similarities between the mouse and the human coding sequences for this gene. Such detailed analysis of splice variants may identify novel alternative splicing relevant to disease.</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Genomic mapping of mouse peptide LLEAQIATGGIIDPK using UCSC Blast program</p>
               </caption>
               <text>
                  <p>Genomic mapping of mouse peptide LLEAQIATGGIIDPK using UCSC Blast program. Mouse splice variant M13C2563_1_s386_e8960_1_rf2_c1_n0 was identified with 13 distinct peptides. Twelve peptides matched a predicted mouse protein similar to desmoplakin using a homolog search against the NCBI NR database. However, all 13 peptides were homologous to the human desmoplakin sequence. Of note, mouse peptide LLEAQIATGGIIDPK aligns to the coding sequence of human desmoplakin, but not to the annotated mouse desmoplakin gene.</p>
               </text>
               <graphic file="gb-2008-9-6-r93-3"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Protein fractionation as a means to characterize splice isoform products</p>
            </st>
            <p>When the protein products of alternative splice isoforms differ in structure, we expect that the physical properties of these proteins, in particular their fraction location, may vary. Finding evidence for non-neighboring fractions with distinct peptide content for the same protein supports the identification of multiple products from the same gene. Figure <figr fid="F4">4</figr> illustrates this analysis for the major histocompatibility complex (MHC) H2 K1 K region antigen. Intact proteins were subjected to anion exchange (AX) and reverse phase (RP) chromatography fractionation in this study. Each fraction was then subjected to tryptic digestion and LC-MS/MS analysis. Figure <figr fid="F4">4</figr> shows the distribution of peptides derived from this gene among the AX and RP chromatography fractions. The unique peptides identified in the major splice isoform and alternative splice variants were found in separate fractions, consistent with translation of the different splice isoforms yielding distinct protein products with distinct physical properties. The MHC H2 K1 K region gene encodes one of the MHC class 1 antigens, which may be altered in tumors <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>.</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>IPAS mapping of splice isoform variants for the MHC H2 K1 K gene</p>
               </caption>
               <text>
                  <p>IPAS mapping of splice isoform variants for the MHC H2 K1 K gene. Intact proteins were subjected to anion exchange (AX) and reverse phase (RP) chromatography fractionation. Each fraction was then subjected to tryptic digestion and LC-MS/MS analysis. Peptides derived from novel exons falling within the MHC 2 K1 K gene were identified. Spectral counts for matching peptides derived from this gene are plotted as a function of AX and RP fractionation. The color of each cell indicates the number of matching spectra: black = high; gray = medium; light gray = low; white = zero. <b>(a) </b>The distribution of spectra matching the major annotated splice isoform (ENSMUST00000025181). <b>(b) </b>The distribution of spectra matching the novel splice isoform (M17C4317_13_s2_e917_1_rf2_c1_n0|). <b>(c) </b>The distribution of spectra matching peptides found in both the major annotated splice isoform for this gene (ENSMUST00000025181) and the novel splice isoform (M17C4317_13_s2_e917_1_rf2_c1_n0|).</p>
               </text>
               <graphic file="gb-2008-9-6-r93-4"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Pathway annotation of identified mouse plasma proteins</p>
            </st>
            <p>To determine whether sufficient depth of analysis was achieved to identify proteins that are relevant to disease, we performed ingenuity pathway analysis <abbrgrp><abbr bid="B14">14</abbr></abbrgrp> for 1,058 proteins that were fully annotated to known proteins. A number of known genes may be candidate disease biomarkers based on splice variants. For example, CD44 <abbrgrp><abbr bid="B25">25</abbr></abbrgrp> is a cell-surface glycoprotein that participates in a variety of cellular functions, including tumor metastasis. Alternative splicing generates a diverse collection of structurally and functionally distinct protein products from this gene <abbrgrp><abbr bid="B14">14</abbr><abbr bid="B26">26</abbr><abbr bid="B27">27</abbr></abbrgrp>. CD44 gene products, consisting of three splice isoforms, are found in the integrated set of proteins defined by the lead peptide YGFIEGNVVIPR. This group of 3 splice isoforms was identified with 3 distinct peptides from 14 spectra in our data set. All members of this group included all three peptides.</p>
            <p>The extracellular matrix protein 1 is another example where the major splice isoform and two novel alternative splice isoforms were found in the integrated list. Extracellular matrix protein 1 is a secreted protein that has been implicated in cell proliferation, angiogenesis and differentiation. This protein is preferentially expressed in epithelial tumors and has been suggested as a potential cancer biomarker <abbrgrp><abbr bid="B28">28</abbr></abbrgrp>.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Discussion</p>
         </st>
         <p>Our study has yielded an in-depth analysis of mouse plasma resulting in a high quality peptide database built from four reference pools. The mouse plasma PeptideAtlas currently contains more than 800,000 spectra corresponding to 13,000 peptides from approximately 3,000 proteins. Additions are expected from accumulation of new data sets resulting from other instrument platforms or sample processing protocols, other database search algorithms and analysis of disease models.</p>
         <p>The identified proteins span an estimated 7 logarithm range of abundance encompassing prostate specific antigen, estimated to occur in plasma at approximately 1 ng/ml <abbrgrp><abbr bid="B29">29</abbr></abbrgrp>, to abundant plasma proteins present at 40 mg/ml. The ability to detect less abundant proteins is highly relevant to biomarker discovery as most known disease biomarkers occur at low-abundance in the range of prostate specific antigen. Detection of low abundance proteins results from a combination of extensive fractionation of intact proteins using an orthogonal two-dimensional system of AX and RP chromatography, and high resolution LC-MS/MS analysis. The methodology also allows detection of protein cleavage products and splice isoforms.</p>
         <p>Some similarities and some differences between human and mouse plasma have emerged from our analysis. An extensive pattern of cleavage of biological significance has been reported previously for human complement factor C3 <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>, and our data demonstrate similar findings for the mouse. In contrast, for EGFR, a marked difference in abundance based on number of spectra was observed between human (10 spectra) and mouse (>4,000), which may be related to differences in sources of EGFR between mouse and human based on gene expression analysis <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. EGFR has the highest expression in liver in mouse, which is not the case for humans. Alternative splicing is an important source of protein diversity <abbrgrp><abbr bid="B31">31</abbr><abbr bid="B32">32</abbr></abbrgrp>, and deep sampling of the plasma proteome as accomplished in this study is relevant to the identification of novel splice isoforms. Variation in the delicately controlled process of splicing may occur in disease states. Alternative splicing in cancer has been investigated on a small scale <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. Proteomic data as obtained in this study provide a complementary approach to annotate the genome <abbrgrp><abbr bid="B33">33</abbr><abbr bid="B34">34</abbr></abbrgrp>, and represent a useful resource for the discovery of alternatively spliced forms. We identified novel splice isoforms of known genes as well as previously un-annotated open reading frames <abbrgrp><abbr bid="B22">22</abbr></abbrgrp>. An assessment of the relevance of identified splice isoforms as disease biomarkers would be of interest.</p>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>We have developed the mouse plasma PeptideAtlas database, along with its web interface, as a means for depositing mass spectrometry derived protein and peptide identifications in mouse plasma. This initial release contains data derived from 568 LC-MS/MS runs of plasma fractions. A total of 13,779 distinct peptides have been identified with high confidence and are included in this release, which can be searched and downloaded. An important component comprises novel isoforms and transcript variants not previously predicted from genome analysis that have been identified.</p>
      </sec>
      <sec>
         <st>
            <p>Materials and methods</p>
         </st>
         <sec>
            <st>
               <p>Sample preparation and mass spectrometry analysis</p>
            </st>
            <p>The data for the mouse plasma PeptideAtlas was produced from an initial set of four reference plasma samples. Each represented a mixture of plasma from a mouse model of cancer and its matched control as presented in Table <tblr tid="T2">2</tblr>. All experiments were carried out using the IPAS methodology <abbrgrp><abbr bid="B29">29</abbr></abbrgrp>. Pooled plasma samples, immunodepleted of the abundant proteins albumin, IgG, and transferrin using an Ms-3 column (Agilent, Wilmington, DE, USA) were subjected to an extensive two-dimensional fractionation schema using AX chromatography followed by RP chromatography, yielding approximately 150 fractions per plasma pool. Each fraction was subjected to in-solution digestion with trypsin followed by LC-MS/MS analysis on either an LTQ-FT or LTQ-Orbitrap mass spectrometer (Thermo-Finnigan, Waltham, MA, USA) coupled to a nanoAcquity nanoflow chromatography system (Waters, Milford, MA, USA).</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Sources of plasma reference sets</p>
               </caption>
               <tblbdy cols="6">
                  <r>
                     <c ca="left">
                        <p>Sample tag</p>
                     </c>
                     <c ca="center">
                        <p>Sample ID</p>
                     </c>
                     <c ca="left">
                        <p>Mouse model</p>
                     </c>
                     <c ca="left">
                        <p>Strain</p>
                     </c>
                     <c ca="center">
                        <p>Number of fractions analyzed</p>
                     </c>
                     <c ca="left">
                        <p>Instrument</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="6">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Pancreatic cancer and matched control</p>
                     </c>
                     <c ca="center">
                        <p>347</p>
                     </c>
                     <c ca="left">
                        <p>[42] Kras and INK/ARF</p>
                     </c>
                     <c ca="left">
                        <p>FVB/n</p>
                     </c>
                     <c ca="center">
                        <p>163</p>
                     </c>
                     <c ca="left">
                        <p>Thermo LTQ-FT</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Breast cancer and matched control</p>
                     </c>
                     <c ca="center">
                        <p>348</p>
                     </c>
                     <c ca="left">
                        <p>[43] Her2/Neu</p>
                     </c>
                     <c ca="left">
                        <p>FVB</p>
                     </c>
                     <c ca="center">
                        <p>144</p>
                     </c>
                     <c ca="left">
                        <p>Thermo Orbitrap</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Ovarian cancer and matched control</p>
                     </c>
                     <c ca="center">
                        <p>349</p>
                     </c>
                     <c ca="left">
                        <p>[44] <it>LSL-K-ras</it><sup>G12D/+ </sup><it>Pten</it><sup>loxP/loxP</sup></p>
                     </c>
                     <c ca="left">
                        <p>LSL</p>
                     </c>
                     <c ca="center">
                        <p>144</p>
                     </c>
                     <c ca="left">
                        <p>Thermo LTQ-FT</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Colon cancer and matched control</p>
                     </c>
                     <c ca="center">
                        <p>350</p>
                     </c>
                     <c ca="left">
                        <p>[45] D580</p>
                     </c>
                     <c ca="left">
                        <p>129/B6</p>
                     </c>
                     <c ca="center">
                        <p>117</p>
                     </c>
                     <c ca="left">
                        <p>Thermo LTQ-FT</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>Each set consisted of a pool of plasma from a mouse model of cancer and its matched wild-type control.</p>
               </tblfn>
            </tbl>
         </sec>
         <sec>
            <st>
               <p>Database searches and building the mouse plasma PeptideAtlas</p>
            </st>
            <p>Acquired data were automatically processed through the Computational Proteomics Analysis System <abbrgrp><abbr bid="B35">35</abbr></abbrgrp> pipeline. The database search was initiated using the X!Tandem algorithm <abbrgrp><abbr bid="B12">12</abbr></abbrgrp> with the comet k-score module plug-in <abbrgrp><abbr bid="B36">36</abbr></abbrgrp>. The mouse IPI database <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>, version 3.13, was used throughout the project. All results of sequence searching were subsequently processed through PeptideProphet <abbrgrp><abbr bid="B10">10</abbr></abbrgrp> for peptide validation and quality control, using the Trans Proteomic Pipeline <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>, version 2.9.9. All identifications with a PeptideProphet probability (P) 0.9 and above were combined to form a master list of observed peptides across all four reference sets. All experimental data were loaded into a proteomics analysis database module under the Systems Biology Experiment Analysis Management System <abbrgrp><abbr bid="B39">39</abbr></abbrgrp>. The identified peptide sequences were then mapped to the Ensembl mouse release 43 proteome based on NCBI mouse genome build 36, and the results were loaded into the PeptideAtlas relational database <abbrgrp><abbr bid="B40">40</abbr><abbr bid="B41">41</abbr></abbrgrp>.</p>
            <p>ProteinProphet <abbrgrp><abbr bid="B13">13</abbr></abbrgrp> was run on these reference data sets in a combined mode for protein identification. Proteins with less than 5% error rate from ProteinProphet were further characterized with respect to tissue expression. Mouse GNF 1M GeneAtlas, developed at the Genomics Institute of the Novartis Research Foundation <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>, was downloaded, and the tissue with the maximum expression for a given gene was assigned to that particular gene/protein. Subcellular location and major functional network categorizations were based on ingenuity pathway analysis <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Analysis of alternative splice isoforms</p>
            </st>
            <p>A target database, which had a total of 10,381,156 protein sequences, was generated <abbrgrp><abbr bid="B22">22</abbr></abbrgrp> as follows: cDNA sequences from the ECgene database <abbrgrp><abbr bid="B21">21</abbr></abbrgrp> and from the Ensembl mouse database <abbrgrp><abbr bid="B11">11</abbr></abbrgrp> were obtained in FASTA format; each sequence set was translated separately in 3 reading frames and the first instance of every protein sequence longer than 14 amino acids was recorded; the sequences were combined and then filtered for redundancy (preference was given to protein sequences originating from an Ensembl transcript); and a collection of common protein contaminants and reverse protein sequences was appended to the sequence database. The formatted peak list files from each dataset were searched against the target database using X!Tandem; peptides identified with an X!Tandem expect value of &lt;0.001 were extracted for further analyses.</p>
         </sec>
         <sec>
            <st>
               <p>Protein peptide identifications to determine minimal covering sets</p>
            </st>
            <p>Many transcription units produce transcripts with multiple splice isoforms that share exons. This often precludes assigning a peptide as the translation product of a specific splice isoform. To avoid redundancy in analysis, protein identifications were integrated to determine the minimum number of covering sets. A covering set is defined as a set of proteins containing all of the identified peptides. The minimal covering set is the covering set with the smallest number of members.</p>
            <p>Defining a minimal covering set is a nondeterministic polynomial-time hard (NP hard) calculation, so exact definition of the minimal covering set is not feasible for data sets of the size found in protein/peptide identifications. Instead, we employ a heuristic approach to find approximately optimal solutions. Each member of the covering set of proteins is defined by a 'lead peptide'. The minimal covering set of proteins needed to explain the observed peptide identification data was generated as follows: step 1, a list of peptides identified in all experiments was created; step 2, the peptide list was ordered by the number of spectra matching the peptide; step 3, the peptide matching the largest number of spectra was selected (the 'lead peptide'); step 4, a list of all proteins containing this peptide was generated; step 5, the protein list was sorted by the number of spectra matching peptides derived from the protein; step 6, the Ensembl protein having the largest number of matching spectra was selected (in the event of ties, the protein having the largest number of distinct peptides was selected; if there were no Ensembl proteins in the list, the splice variant with the largest number of spectra and distinct peptides was selected); step 7, all peptides contained in this protein were removed from the peptide list; step 8, the procedure was repeated beginning with step 3 until no unassigned peptides remained, thus generating a covering set of proteins that contained all of the identified peptides. Each protein in the covering set contains at least one peptide that is unique to this protein among all of the members of the covering set.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Abbreviations</p>
         </st>
         <p>AX, anion exchange; EGFR, epidermal growth factor receptor; IPAS, intact protein analysis system; IPI, International Protein Index; LC-MS/MS, liquid chromatography-tandem mass spectrometry; MHC, histocompatibility complex; P, probability; RP, reverse phase.</p>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>QZ designed the study, performed data analysis, and drafted the manuscript. RM carried out the genomic data analysis and helped with the draft. EWD carried out the building of the mouse plasma PeptideAtlas and made it public. SJP, VMF, HW, and LFN performed the IPAS experiments. RAD, NB, DD, KEH, RK, TJ, and KP provided samples. RA, GSO, and DJS were involved in data analysis and helped with the draft. SMH designed the study and revised the draft. All authors read and approved the final manuscript.</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>The work was supported in part with Federal funds from the National Heart, Lung, and Blood Institute, National Institutes of Health, under contract N01-HV-28179, and National Cancer Institute, U01 (MMHCC) and P01 (PDAC).</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Chromosomally unstable mouse tumours have genomic alterations similar to diverse human cancers.</p>
            </title>
            <aug>
               <au>
                  <snm>Maser</snm>
                  <fnm>RS</fnm>
               </au>
               <au>
                  <snm>Choudhury</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Campbell</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Feng</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Wong</snm>
                  <fnm>KK</fnm>
               </au>
               <au>
                  <snm>Protopopov</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>O'Neil</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Gutierrez</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Ivanova</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Perna</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Lin</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Mani</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Jiang</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>McNamara</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Zaghlul</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Edkins</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Stevens</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Brennan</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Martin</snm>
                  <fnm>ES</fnm>
               </au>
               <au>
                  <snm>Wiedemeyer</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Kabbarah</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Nogueira</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Histen</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Aster</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Mansour</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Duke</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Foroni</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Fielding</snm>
                  <fnm>AK</fnm>
               </au>
               <au>
                  <snm>Goldstone</snm>
                  <fnm>AH</fnm>
               </au>
               <au>
                  <snm>Rowe</snm>
                  <fnm>JM</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nature</source>
            <pubdate>2007</pubdate>
            <volume>447</volume>
            <fpage>966</fpage>
            <lpage>971</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">17515920</pubid>
                  <pubid idtype="doi">10.1038/nature05886</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>Identification and validation of oncogenes in liver cancer using an integrative oncogenomic approach.</p>
            </title>
            <aug>
               <au>
                  <snm>Zender</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Spector</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Xue</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Flemming</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Cordon-Cardo</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Silke</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Fan</snm>
                  <fnm>ST</fnm>
               </au>
               <au>
                  <snm>Luk</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Wigler</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Hannon</snm>
                  <fnm>GJ</fnm>
               </au>
               <au>
                  <snm>Mu</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Lucito</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Powers</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Lowe</snm>
                  <fnm>SW</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>2006</pubdate>
            <volume>125</volume>
            <fpage>1253</fpage>
            <lpage>1267</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">16814713</pubid>
                  <pubid idtype="doi">10.1016/j.cell.2006.05.030</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Of mice and men: cancer gene discovery using comparative oncogenomics.</p>
            </title>
            <aug>
               <au>
                  <snm>Tomlins</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Chinnaiyan</snm>
                  <fnm>AM</fnm>
               </au>
            </aug>
            <source>Cancer Cell</source>
            <pubdate>2006</pubdate>
            <volume>10</volume>
            <fpage>2</fpage>
            <lpage>4</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">16843259</pubid>
                  <pubid idtype="doi">10.1016/j.ccr.2006.06.013</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <title>
               <p>Comparative oncogenomics identifies NEDD9 as a melanoma metastasis gene.</p>
            </title>
            <aug>
               <au>
                  <snm>Kim</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Gans</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Nogueira</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Paik</snm>
                  <fnm>JH</fnm>
               </au>
               <au>
                  <snm>Feng</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Brennan</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Hahn</snm>
                  <fnm>WC</fnm>
               </au>
               <au>
                  <snm>Cordon-Cardo</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Wagner</snm>
                  <fnm>SN</fnm>
               </au>
               <au>
                  <snm>Flotte</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Duncan</snm>
                  <fnm>LM</fnm>
               </au>
               <au>
                  <snm>Granter</snm>
                  <fnm>SR</fnm>
               </au>
               <au>
                  <snm>Chin</snm>
                  <fnm>L</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>2006</pubdate>
            <volume>125</volume>
            <fpage>1269</fpage>
            <lpage>1281</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">16814714</pubid>
                  <pubid idtype="doi">10.1016/j.cell.2006.06.008</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>An oncogenic KRAS2 expression signature identified by cross-species gene-expression analysis.</p>
            </title>
            <aug>
               <au>
                  <snm>Sweet-Cordero</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Mukherjee</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Subramanian</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>You</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Roix</snm>
                  <fnm>JJ</fnm>
               </au>
               <au>
                  <snm>Ladd-Acosta</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Mesirov</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Golub</snm>
                  <fnm>TR</fnm>
               </au>
               <au>
                  <snm>Jacks</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Nat Genet</source>
            <pubdate>2005</pubdate>
            <volume>37</volume>
            <fpage>48</fpage>
            <lpage>55</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15608639</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Analysis of the mouse liver proteome using advanced mass spectrometry.</p>
            </title>
            <aug>
               <au>
                  <snm>Shi</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Kumar</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Zougman</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Podtelejnikov</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Cox</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wisniewski</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Mann</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>J Proteome Res</source>
            <pubdate>2007</pubdate>
            <volume>6</volume>
            <fpage>2963</fpage>
            <lpage>2972</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">17608399</pubid>
                  <pubid idtype="doi">10.1021/pr0605668</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>Integrated pipeline for mass spectrometry-based discovery and confirmation of biomarkers demonstrated in a mouse model of breast cancer.</p>
            </title>
            <aug>
               <au>
                  <snm>Whiteaker</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Zhao</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Kelly-Spratt</snm>
                  <fnm>KS</fnm>
               </au>
               <au>
                  <snm>Ivey</snm>
                  <fnm>RG</fnm>
               </au>
               <au>
                  <snm>Piening</snm>
                  <fnm>BD</fnm>
               </au>
               <au>
                  <snm>Feng</snm>
                  <fnm>LC</fnm>
               </au>
               <au>
                  <snm>Kasarda</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Gurley</snm>
                  <fnm>KE</fnm>
               </au>
               <au>
                  <snm>Eng</snm>
                  <fnm>JK</fnm>
               </au>
               <au>
                  <snm>Chodosh</snm>
                  <fnm>LA</fnm>
               </au>
               <au>
                  <snm>Kemp</snm>
                  <fnm>CJ</fnm>
               </au>
               <au>
                  <snm>McIntosh</snm>
                  <fnm>MW</fnm>
               </au>
               <au>
                  <snm>Paulovich</snm>
                  <fnm>AG</fnm>
               </au>
            </aug>
            <source>J Proteome Res</source>
            <pubdate>2007</pubdate>
            <volume>6</volume>
            <fpage>3962</fpage>
            <lpage>3975</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">17711321</pubid>
                  <pubid idtype="doi">10.1021/pr0604920</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Mass spectrometry-based study of the plasma proteome in a mouse intestinal tumor model.</p>
            </title>
            <aug>
               <au>
                  <snm>Hung</snm>
                  <fnm>KE</fnm>
               </au>
               <au>
                  <snm>Kho</snm>
                  <fnm>AT</fnm>
               </au>
               <au>
                  <snm>Sarracino</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Richard</snm>
                  <fnm>LG</fnm>
               </au>
               <au>
                  <snm>Krastins</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Forrester</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Haab</snm>
                  <fnm>BB</fnm>
               </au>
               <au>
                  <snm>Kohane</snm>
                  <fnm>IS</fnm>
               </au>
               <au>
                  <snm>Kucherlapati</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>J Proteome Res</source>
            <pubdate>2006</pubdate>
            <volume>5</volume>
            <fpage>1866</fpage>
            <lpage>1878</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">16889408</pubid>
                  <pubid idtype="doi">10.1021/pr060120r</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>PeptideAtlas</p>
            </title>
            <url>http://www.peptideatlas.org</url>
         </bibl>
         <bibl id="B10">
            <title>
               <p>Empirical statistical model to estimate the accuracy of peptide identifications made by MS/MS and database search.</p>
            </title>
            <aug>
               <au>
                  <snm>Keller</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Nesvizhskii</snm>
                  <fnm>AI</fnm>
               </au>
               <au>
                  <snm>Kolker</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Aebersold</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Anal Chem</source>
            <pubdate>2002</pubdate>
            <volume>74</volume>
            <fpage>5383</fpage>
            <lpage>5392</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid">12403597</pubid>
                  <pubid idtype="doi">10.1021/ac025747h</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>Ensembl Mouse</p>
            </title>
            <url>http://www.ensembl.org/Mus_musculus/index.html</url>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Using annotated peptide mass spectrum libraries for protein identification.</p>
            </title>
            <aug>
               <au>
                  <snm>Craig</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Cortens</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Fenyo</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Beavis</snm>
                  <fnm>RC</fnm>
               </au>
            </aug>
            <source>J Proteome Res</source>
            <pubdate>2006</pubdate>
            <volume>5</volume>
            <fpage>1843</fpage>
            <lpage>1849</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">16889405</pubid>
                  <pubid idtype="doi">10.1021/pr0602085</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>A statistical model for identifying proteins by tandem mass spectrometry.</p>
            </title>
            <aug>
               <au>
                  <snm>Nesvizhskii</snm>
                  <fnm>AI</fnm>
               </au>
               <au>
                  <snm>Keller</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Kolker</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Aebersold</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Anal Chem</source>
            <pubdate>2003</pubdate>
            <volume>75</volume>
            <fpage>4646</fpage>
            <lpage>4658</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid">14632076</pubid>
                  <pubid idtype="doi">10.1021/ac0341261</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Ingenuity Pathway Analysis</p>
            </title>
            <url>http://www.ingenuity.com</url>
         </bibl>
         <bibl id="B15">
            <title>
               <p>SymAtlas</p>
            </title>
            <url>http://symatlas.gnf.org/</url>
         </bibl>
         <bibl id="B16">
            <title>
               <p>ExPASy Proteomics Server</p>
            </title>
            <url>http://au.expasy.org/uniprot/Q01279</url>
         </bibl>
         <bibl id="B17">
            <title>
               <p>GeneCard</p>
            </title>
            <url>http://www.genecards.org/cgi-bin/carddisp.pl?gene=EGFR&amp;search=egfr</url>
         </bibl>
         <bibl id="B18">
            <title>
               <p>Cathepsin B and its role(s) in cancer progression.</p>
            </title>
            <aug>
               <au>
                  <snm>Podgorski</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Sloane</snm>
                  <fnm>BF</fnm>
               </au>
            </aug>
            <source>Biochem Soc Symp</source>
            <pubdate>2003</pubdate>
            <volume>70</volume>
            <fpage>263</fpage>
            <lpage>276</lpage>
            <xrefbib>
               <pubid idtype="pmpid">14587299</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Alternative splicing in disease and therapy.</p>
            </title>
            <aug>
               <au>
                  <snm>Garcia-Blanco</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Baraniak</snm>
                  <fnm>AP</fnm>
               </au>
               <au>
                  <snm>Lasda</snm>
                  <fnm>EL</fnm>
               </au>
            </aug>
            <source>Nat Biotechnol</source>
            <pubdate>2004</pubdate>
            <volume>22</volume>
            <fpage>535</fpage>
            <lpage>546</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">15122293</pubid>
                  <pubid idtype="doi">10.1038/nbt964</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>The ENCODE (ENCyclopedia Of DNA Elements) Project.</p>
            </title>
            <aug>
               <au>
                  <cnm>ENCODE Project Consortium</cnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2004</pubdate>
            <volume>306</volume>
            <fpage>636</fpage>
            <lpage>640</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">15499007</pubid>
                  <pubid idtype="doi">10.1126/science.1105136</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>ECgene</p>
            </title>
            <url>http://genome.ewha.ac.kr/ECgene/</url>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Novel gene and gene model detection using a whole genome open reading frame analysis in proteomics.</p>
            </title>
            <aug>
               <au>
                  <snm>Fermin</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Allen</snm>
                  <fnm>BB</fnm>
               </au>
               <au>
                  <snm>Blackwell</snm>
                  <fnm>TW</fnm>
               </au>
               <au>
                  <snm>Menon</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Adamski</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Ulintz</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Omenn</snm>
                  <fnm>GS</fnm>
               </au>
               <au>
                  <snm>States</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2006</pubdate>
            <volume>7</volume>
            <fpage>R35</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">16646984</pubid>
                  <pubid idtype="doi">10.1186/gb-2006-7-4-r35</pubid>
                  <pubid idtype="pmcid">1557991</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B23">
            <title>
               <p>Discovery of cancer biomarkers through the use of mouse models.</p>
            </title>
            <aug>
               <au>
                  <snm>Kuick</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Misek</snm>
                  <fnm>DE</fnm>
               </au>
               <au>
                  <snm>Monsma</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Webb</snm>
                  <fnm>CP</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Peterson</snm>
                  <fnm>KJ</fnm>
               </au>
               <au>
                  <snm>Pisano</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Omenn</snm>
                  <fnm>GS</fnm>
               </au>
               <au>
                  <snm>Hanash</snm>
                  <fnm>SM</fnm>
               </au>
            </aug>
            <source>Cancer Lett</source>
            <pubdate>2007</pubdate>
            <volume>249</volume>
            <fpage>40</fpage>
            <lpage>48</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">17320282</pubid>
                  <pubid idtype="doi">10.1016/j.canlet.2006.12.032</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Altered pattern of major histocompatibility complex expression in renal carcinoma: tumor-specific expression of the nonclassical human leukocyte antigen-G molecule is restricted to clear cell carcinoma while up-regulation of other major histocompatibility complex antigens is primarily distributed in all subtypes of renal carcinoma.</p>
            </title>
            <aug>
               <au>
                  <snm>Ibrahim el</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Allory</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Commo</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Gattegno</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Callard</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Paul</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Am J Pathol</source>
            <pubdate>2003</pubdate>
            <volume>162</volume>
            <fpage>501</fpage>
            <lpage>508</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1851152</pubid>
                  <pubid idtype="pmpid" link="fulltext">12547708</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>Splice variants as cancer biomarkers.</p>
            </title>
            <aug>
               <au>
                  <snm>Brinkman</snm>
                  <fnm>BM</fnm>
               </au>
            </aug>
            <source>Clin Biochem</source>
            <pubdate>2004</pubdate>
            <volume>37</volume>
            <fpage>584</fpage>
            <lpage>594</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">15234240</pubid>
                  <pubid idtype="doi">10.1016/j.clinbiochem.2004.05.015</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>CD44 expression is associated with increased survival in node-negative invasive breast carcinoma.</p>
            </title>
            <aug>
               <au>
                  <snm>Diaz</snm>
                  <fnm>LK</fnm>
               </au>
               <au>
                  <snm>Zhou</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Wright</snm>
                  <fnm>ET</fnm>
               </au>
               <au>
                  <snm>Cristofanilli</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Sneige</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Sahin</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Gilcrease</snm>
                  <fnm>MZ</fnm>
               </au>
            </aug>
            <source>Clin Cancer Res</source>
            <pubdate>2005</pubdate>
            <volume>11</volume>
            <fpage>3309</fpage>
            <lpage>3314</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">15867228</pubid>
                  <pubid idtype="doi">10.1158/1078-0432.CCR-04-2184</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>Prognostic value of CD44 isoform expression in thymic epithelial neoplasms.</p>
            </title>
            <aug>
               <au>
                  <snm>Sonobe</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Miyamoto</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Nobukawa</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Izumi</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Futagawa</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Ishikawa</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Yamazaki</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Uekusa</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Abe</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Suda</snm>
                  <fnm>K</fnm>
               </au>
            </aug>
            <source>Cancer</source>
            <pubdate>2005</pubdate>
            <volume>103</volume>
            <fpage>2015</fpage>
            <lpage>2022</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">15830350</pubid>
                  <pubid idtype="doi">10.1002/cncr.21046</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Extracellular matrix protein 1 (ECM1) is over-expressed in malignant epithelial tumors.</p>
            </title>
            <aug>
               <au>
                  <snm>Wang</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Yu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ni</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>XM</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ning</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Pei</snm>
                  <fnm>XF</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Underhill</snm>
                  <fnm>CB</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Liekens</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Merregaert</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>L</fnm>
               </au>
            </aug>
            <source>Cancer Lett</source>
            <pubdate>2003</pubdate>
            <volume>200</volume>
            <fpage>57</fpage>
            <lpage>67</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">14550953</pubid>
                  <pubid idtype="doi">10.1016/S0304-3835(03)00350-1</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>Contribution of protein fractionation to depth of analysis of the serum and plasma proteomes.</p>
            </title>
            <aug>
               <au>
                  <snm>Faca</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Pitteri</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Newcomb</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Glukhova</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Phanstiel</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Krasnoselsky</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Struthers</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Eng</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Fitzgibbon</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>M</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Hanash</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>J Proteome Res</source>
            <pubdate>2007</pubdate>
            <volume>6</volume>
            <fpage>3558</fpage>
            <lpage>3565</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">17696519</pubid>
                  <pubid idtype="doi">10.1021/pr070233q</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>A wide range of protein isoforms in serum and plasma uncovered by a quantitative intact protein analysis system.</p>
            </title>
            <aug>
               <au>
                  <snm>Misek</snm>
                  <fnm>DE</fnm>
               </au>
               <au>
                  <snm>Kuick</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Deng</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Zhao</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Galchev</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Tra</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Pisano</snm>
                  <fnm>MR</fnm>
               </au>
               <au>
                  <snm>Amunugama</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Allen</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Strahler</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Andrews</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Omenn</snm>
                  <fnm>GS</fnm>
               </au>
               <au>
                  <snm>Hanash</snm>
                  <fnm>SM</fnm>
               </au>
            </aug>
            <source>Proteomics</source>
            <pubdate>2005</pubdate>
            <volume>5</volume>
            <fpage>3343</fpage>
            <lpage>3352</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">16047307</pubid>
                  <pubid idtype="doi">10.1002/pmic.200500103</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>Gene structure prediction and alternative splicing analysis using genomically aligned ESTs.</p>
            </title>
            <aug>
               <au>
                  <snm>Kan</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Rouchka</snm>
                  <fnm>EC</fnm>
               </au>
               <au>
                  <snm>Gish</snm>
                  <fnm>WR</fnm>
               </au>
               <au>
                  <snm>States</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2001</pubdate>
            <volume>11</volume>
            <fpage>889</fpage>
            <lpage>900</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">11337482</pubid>
                  <pubid idtype="doi">10.1101/gr.155001</pubid>
                  <pubid idtype="pmcid">311065</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>Protein diversity from alternative splicing: a challenge for bioinformatics and post-genome biology.</p>
            </title>
            <aug>
               <au>
                  <snm>Black</snm>
                  <fnm>DL</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>2000</pubdate>
            <volume>103</volume>
            <fpage>367</fpage>
            <lpage>370</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">11081623</pubid>
                  <pubid idtype="doi">10.1016/S0092-8674(00)00128-8</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>Challenges in deriving high-confidence protein identifications from data gathered by a HUPO plasma proteome collaborative study.</p>
            </title>
            <aug>
               <au>
                  <snm>States</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Omenn</snm>
                  <fnm>GS</fnm>
               </au>
               <au>
                  <snm>Blackwell</snm>
                  <fnm>TW</fnm>
               </au>
               <au>
                  <snm>Fermin</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Eng</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Speicher</snm>
                  <fnm>DW</fnm>
               </au>
               <au>
                  <snm>Hanash</snm>
                  <fnm>SM</fnm>
               </au>
            </aug>
            <source>Nat Biotechnol</source>
            <pubdate>2006</pubdate>
            <volume>24</volume>
            <fpage>333</fpage>
            <lpage>338</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">16525410</pubid>
                  <pubid idtype="doi">10.1038/nbt1183</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B34">
            <title>
               <p>Proteogenomic mapping as a complementary method to perform genome annotation.</p>
            </title>
            <aug>
               <au>
                  <snm>Jaffe</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Berg</snm>
                  <fnm>HC</fnm>
               </au>
               <au>
                  <snm>Church</snm>
                  <fnm>GM</fnm>
               </au>
            </aug>
            <source>Proteomics</source>
            <pubdate>2004</pubdate>
            <volume>4</volume>
            <fpage>59</fpage>
            <lpage>77</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">14730672</pubid>
                  <pubid idtype="doi">10.1002/pmic.200300511</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>Computational Proteomics Analysis System (CPAS)</p>
            </title>
            <url>http://proteomics.fhcrc.org/CPAS/project/home/begin.view</url>
         </bibl>
         <bibl id="B36">
            <title>
               <p>General framework for developing and evaluating database scoring algorithms using the TANDEM search engine.</p>
            </title>
            <aug>
               <au>
                  <snm>Maclean</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Eng</snm>
                  <fnm>JK</fnm>
               </au>
               <au>
                  <snm>Beavis</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>McIntosh</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2006</pubdate>
            <volume>22</volume>
            <fpage>2830</fpage>
            <lpage>2832</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">16877754</pubid>
                  <pubid idtype="doi">10.1093/bioinformatics/btl379</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B37">
            <title>
               <p>The International Protein Index: an integrated database for proteomics experiments.</p>
            </title>
            <aug>
               <au>
                  <snm>Kersey</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Duarte</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Williams</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Karavidopoulou</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Birney</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Apweiler</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Proteomics</source>
            <pubdate>2004</pubdate>
            <volume>4</volume>
            <fpage>1985</fpage>
            <lpage>1988</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1002/pmic.200300721</pubid>
                  <pubid idtype="pmpid" link="fulltext">15221759</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <title>
               <p>A uniform proteomics MS/MS analysis platform utilizing open XML file formats.</p>
            </title>
            <aug>
               <au>
                  <snm>Keller</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Eng</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>XJ</fnm>
               </au>
               <au>
                  <snm>Aebersold</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Mol Syst Biol</source>
            <pubdate>2005</pubdate>
            <volume>1</volume>
            <fpage>2005.0017</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">16729052</pubid>
                  <pubid idtype="doi">10.1038/msb4100024</pubid>
                  <pubid idtype="pmcid">1681455</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B39">
            <title>
               <p>Systems Biology Experiment Analysis Management System (SBEAMS)</p>
            </title>
            <url>http://www.sbeams.org</url>
         </bibl>
         <bibl id="B40">
            <title>
               <p>Integration with the human genome of peptide sequences obtained by high-throughput mass spectrometry.</p>
            </title>
            <aug>
               <au>
                  <snm>Desiere</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Deutsch</snm>
                  <fnm>EW</fnm>
               </au>
               <au>
                  <snm>Nesvizhskii</snm>
                  <fnm>AI</fnm>
               </au>
               <au>
                  <snm>Mallick</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>King</snm>
                  <fnm>NL</fnm>
               </au>
               <au>
                  <snm>Eng</snm>
                  <fnm>JK</fnm>
               </au>
               <au>
                  <snm>Aderem</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Boyle</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Brunner</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Donohoe</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Fausto</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Hafen</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Hood</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Katze</snm>
                  <fnm>MG</fnm>
               </au>
               <au>
                  <snm>Kennedy</snm>
                  <fnm>KA</fnm>
               </au>
               <au>
                  <snm>Kregenow</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Lin</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Martin</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Ranish</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Rawlings</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Samelson</snm>
                  <fnm>LE</fnm>
               </au>
               <au>
                  <snm>Shiio</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Watts</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Wollscheid</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Wright</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Yan</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Yi</snm>
                  <fnm>EC</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>H</fnm>
               </au>
               <etal/>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2005</pubdate>
            <volume>6</volume>
            <fpage>R9</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">15642101</pubid>
                  <pubid idtype="doi">10.1186/gb-2004-6-1-r9</pubid>
                  <pubid idtype="pmcid">549070</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B41">
            <title>
               <p>The PeptideAtlas project.</p>
            </title>
            <aug>
               <au>
                  <snm>Desiere</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Deutsch</snm>
                  <fnm>EW</fnm>
               </au>
               <au>
                  <snm>King</snm>
                  <fnm>NL</fnm>
               </au>
               <au>
                  <snm>Nesvizhskii</snm>
                  <fnm>AI</fnm>
               </au>
               <au>
                  <snm>Mallick</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Eng</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Eddes</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Loevenich</snm>
                  <fnm>SN</fnm>
               </au>
               <au>
                  <snm>Aebersold</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2006</pubdate>
            <volume>34</volume>
            <issue>Database issue</issue>
            <fpage>D655</fpage>
            <lpage>D658</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">16381952</pubid>
                  <pubid idtype="doi">10.1093/nar/gkj040</pubid>
                  <pubid idtype="pmcid">1347403</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B42">
            <title>
               <p>Activated Kras and Ink4a/Arf deficiency cooperate to produce metastatic pancreatic ductal adenocarcinoma.</p>
            </title>
            <aug>
               <au>
                  <snm>Aguirre</snm>
                  <fnm>AJ</fnm>
               </au>
               <au>
                  <snm>Bardeesy</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Sinha</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Lopez</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Tuveson</snm>
                  <fnm>DA</fnm>
               </au>
               <au>
                  <snm>Horner</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Redston</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>DePinho</snm>
                  <fnm>RA</fnm>
               </au>
            </aug>
            <source>Genes Dev</source>
            <pubdate>2003</pubdate>
            <volume>17</volume>
            <fpage>3112</fpage>
            <lpage>3126</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">14681207</pubid>
                  <pubid idtype="doi">10.1101/gad.1158703</pubid>
                  <pubid idtype="pmcid">305262</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B43">
            <title>
               <p>Conditional activation of Neu in the mammary epithelium of transgenic mice results in reversible pulmonary metastasis.</p>
            </title>
            <aug>
               <au>
                  <snm>Moody</snm>
                  <fnm>SE</fnm>
               </au>
               <au>
                  <snm>Sarkisian</snm>
                  <fnm>CJ</fnm>
               </au>
               <au>
                  <snm>Hahn</snm>
                  <fnm>KT</fnm>
               </au>
               <au>
                  <snm>Gunther</snm>
                  <fnm>EJ</fnm>
               </au>
               <au>
                  <snm>Pickup</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Dugan</snm>
                  <fnm>KD</fnm>
               </au>
               <au>
                  <snm>Innocent</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Cardiff</snm>
                  <fnm>RD</fnm>
               </au>
               <au>
                  <snm>Schnall</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Chodosh</snm>
                  <fnm>LA</fnm>
               </au>
            </aug>
            <source>Cancer Cell</source>
            <pubdate>2002</pubdate>
            <volume>2</volume>
            <fpage>451</fpage>
            <lpage>461</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">12498714</pubid>
                  <pubid idtype="doi">10.1016/S1535-6108(02)00212-X</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B44">
            <title>
               <p>Role of K-ras and Pten in the development of mouse models of endometriosis and endometrioid ovarian cancer.</p>
            </title>
            <aug>
               <au>
                  <snm>Dinulescu</snm>
                  <fnm>DM</fnm>
               </au>
               <au>
                  <snm>Ince</snm>
                  <fnm>TA</fnm>
               </au>
               <au>
                  <snm>Quade</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Shafer</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Crowley</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Jacks</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Nat Med</source>
            <pubdate>2005</pubdate>
            <volume>11</volume>
            <fpage>63</fpage>
            <lpage>70</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">15619626</pubid>
                  <pubid idtype="doi">10.1038/nm1173</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B45">
            <title>
               <p>Adenomatous polyposis coli (APC) is required for normal development of skin and thymus.</p>
            </title>
            <aug>
               <au>
                  <snm>Kuraguchi</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>XP</fnm>
               </au>
               <au>
                  <snm>Bronson</snm>
                  <fnm>RT</fnm>
               </au>
               <au>
                  <snm>Rothenberg</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Ohene-Baah</snm>
                  <fnm>NY</fnm>
               </au>
               <au>
                  <snm>Lund</snm>
                  <fnm>JJ</fnm>
               </au>
               <au>
                  <snm>Kucherlapati</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Maas</snm>
                  <fnm>RL</fnm>
               </au>
               <au>
                  <snm>Kucherlapati</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>PLoS Genet</source>
            <pubdate>2006</pubdate>
            <volume>2</volume>
            <fpage>e146</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">17002498</pubid>
                  <pubid idtype="doi">10.1371/journal.pgen.0020146</pubid>
                  <pubid idtype="pmcid">1564426</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
      </refgrp>
   </bm>
</art>
