<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>1471-2164-12-S5-S1</ui>
   <ji>1471-2164</ji>
   <fm>
      <dochead>Research article</dochead>
      <bibl>
         <title>
            <p>Gene selection and classification for cancer microarray data based on machine learning and similarity measures</p>
         </title>
         <aug>
            <au id="A1"><snm>Liu</snm><fnm>Qingzhong</fnm><insr iid="I1"/><email>liu@shsu.edu</email></au>
            <au ca="yes" id="A2"><snm>Sung</snm><mi>H</mi><fnm>Andrew</fnm><insr iid="I2"/><email>sung@cs.nmt.edu</email></au>
            <au id="A3"><snm>Chen</snm><fnm>Zhongxue</fnm><insr iid="I3"/><email>zhongxue.chen@uth.tmc.edu</email></au>
            <au id="A4"><snm>Liu</snm><fnm>Jianzhong</fnm><insr iid="I4"/><email>liujzus@gmail.com</email></au>
            <au id="A5"><snm>Chen</snm><fnm>Lei</fnm><insr iid="I1"/><email>chen@shsu.edu</email></au>
            <au id="A6"><snm>Qiao</snm><fnm>Mengyu</fnm><insr iid="I5"/><email>Mengyu.Qiao@sdsmt.edu</email></au>
            <au id="A7"><snm>Wang</snm><fnm>Zhaohui</fnm><insr iid="I6"/><email>zhaohuiwang1967@gmail.com</email></au>
            <au id="A8"><snm>Huang</snm><fnm>Xudong</fnm><insr iid="I7"/><email>xhuang3@partners.org</email></au>
            <au ca="yes" id="A9"><snm>Deng</snm><fnm>Youping</fnm><insr iid="I6"/><insr iid="I8"/><email>Youping_Deng@rush.edu</email></au>
         </aug>
         <insg>
            <ins id="I1"><p>Department of Computer Science, Sam Houston State University, Huntsville, TX 77341, USA</p></ins>
            <ins id="I2"><p>Department of Computer Science and Institute of Complex Additive Systems Analysis, New Mexico Institute of Mining and Technology, Socorro, NM 87801, USA</p></ins>
            <ins id="I3"><p>Biostatistics Epidemiology Research Design Core, Center for Clinical and Translational Sciences, The University of Texas Health Science Center at Houston, Houston, TX 77030, USA</p></ins>
            <ins id="I4"><p>The Chem21 Group, Inc, 1780 Wilson Drive, Lake Forest, IL 60045, USA</p></ins>
            <ins id="I5"><p>Mathematics and Computer Science, Dept. of Mathematics &amp; Computer Science, South Dakota School of Mines &amp; Technology, Rapid City, SD 57701-3995</p></ins>
            <ins id="I6"><p>Wuhan University of Science and Technology, Wuhan, Hubei 430081, China</p></ins>
            <ins id="I7"><p>Conjugate and Medicinal Chemistry Laboratory, Division of Nuclear Medicine and Molecular Imaging, Department of Radiology, Brigham and Women's Hospital and Harvard Medical School, Boston, MA 02115, USA</p></ins>
            <ins id="I8"><p>Cancer Bioinformatics, Rush University Cancer Center, and Department of Internal Medicine, Rush University Medical Center, Chicago, IL 60612, USA</p></ins>
         </insg>
         <source>BMC Genomics</source>
         
         
         <supplement><title><p>The 2010 International Conference on Bioinformatics and Computational Biology (BIOCOMP 2010): Genomics</p></title><editor>Ke Zhang, Mehdi Pirooznia, Hamid R Arabnia</editor><note>Research</note><url>1471-2164-12-S5.pdf</url></supplement><conference><title><p>BIOCOMP 2010. The 2010 International Conference on Bioinformatics and Computational Biology</p></title><location>Las Vegas, NV, USA</location><date-range>12-15 July 2010</date-range></conference><issn>1471-2164</issn>
         <pubdate>2011</pubdate>
         <volume>12</volume>
         <issue>Suppl 5</issue>
         <fpage>S1</fpage>
         <url>http://www.biomedcentral.com/1471-2164/12/S5/S1</url>
         <xrefbib><pubidlist><pubid idtype="pmpid">22369383</pubid><pubid idtype="doi">10.1186/1471-2164-12-S5-S1</pubid></pubidlist></xrefbib>
      </bibl>
      <history><pub><date><day>23</day><month>12</month><year>2011</year></date></pub></history>
      <cpyrt><year>2011</year><collab>Liu et al. licensee BioMed Central Ltd</collab><note>This is an open access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note></cpyrt>
      <kwdg>
         <kwd>gene selection</kwd>
         <kwd>microarray</kwd>
         <kwd>classification</kwd>
         <kwd>supervised-learning</kwd>
         <kwd>similarity</kwd>
      </kwdg>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>Microarray data have a high dimension of variables and a small sample size. In microarray data analyses, two important issues are how to choose genes, which provide reliable and good prediction for disease status, and how to determine the final gene set that is best for classification. Associations among genetic markers mean one can exploit information redundancy to potentially reduce classification cost in terms of time and money.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>To deal with redundant information and improve classification, we propose a gene selection method, Recursive Feature Addition, which combines supervised learning and statistical similarity measures. To determine the final optimal gene set for prediction and classification, we propose an algorithm, Lagging Prediction Peephole Optimization. By using six benchmark microarray gene expression data sets, we compared Recursive Feature Addition with recently developed gene selection methods: Support Vector Machine Recursive Feature Elimination, Leave-One-Out Calculation Sequential Forward Selection and several others.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusions</p>
               </st>
               <p>On average, with the use of popular learning machines including Nearest Mean Scaled Classifier, Support Vector Machine, Naive Bayes Classifier and Random Forest, Recursive Feature Addition outperformed other methods. Our studies also showed that Lagging Prediction Peephole Optimization is superior to random strategy; Recursive Feature Addition with Lagging Prediction Peephole Optimization obtained better testing accuracies than the gene selection method varSelRF.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>Using microarray techniques, researchers can measure the expression levels for tens of thousands of genes in a single experiment to provide scientists with functional relationship information between the cellular and physiological processes of biological organisms and genes at a genome-wide level. The preprocessing procedure for the raw microarray data consists of background correction, normalization, and summarization. After preprocessing, high-level analyses, such as gene selection, classification, or clustering, are executed for profiling gene expression patterns <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. In the past decade, two main tracks of analyses of microarray data have been to partition genes into closely related groups across time using clustering techniques and to classify patients with different health statuses based on selected gene signatures <abbrgrp><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr><abbr bid="B6">6</abbr></abbrgrp>. Various standards related to systems biology are discussed by Brazma <it>et al. </it><abbrgrp><abbr bid="B7">7</abbr></abbrgrp>. When sample sizes are substantially smaller than the number of features/genes, statistical modeling and inference issues are challenging, which is known as the "large p small n problem". Two important questions and challenges for the high dimensional data analyses are how to choose features that provide reliable and good prediction and how to determine the final optimal feature set that is best for prediction and classification.</p>
         <p>To address the "curse of dimensionality" problem, three strategies have been proposed: filtering, wrapper and embedded methods. Filtering methods select subset features independently from the learning classifiers and do not incorporate learning <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr><abbr bid="B11">11</abbr></abbrgrp>. One of the weaknesses of filtering methods is that they only consider the individual features in isolation and ignore their possible interactions. Yet, the combination of these features may have a combined effect that does not necessarily follow from the individual performance of features in that group <abbrgrp><abbr bid="B12">12</abbr></abbrgrp>. One of the consequences of filtering methods is that we may end up with many highly correlated features/genes; this highly redundant information will worsen classification and prediction performance. Furthermore, if there is a limit on the number of features to be chosen, we may not be able to include all informative features.</p>
         <p>To avoid weakness in filtering methods, wrapper methods wrap around a particular learning algorithm that can assess the selected feature subsets in terms of estimated classification errors to build the final classifier <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>. Wrapper methods use a learning machine to measure the quality of subsets of features. One recent well-known wrapper method for feature/gene selection is Support Vector Machine Recursive Feature Elimination (SVMRFE), proposed by Guyon <it>et al. </it><abbrgrp><abbr bid="B14">14</abbr></abbrgrp>, which refines the optimum feature set by using Support Vector Machine (SVM). The idea of SVMRFE is that the orientation of the separating hyper-plane found by the SVM can be used to select informative features: if the plane is orthogonal to a particular feature dimension, then that feature is informative, and vice versa. In addition to gene selection, SVMRFE has been successfully used in other feature selection and pattern classification situations <abbrgrp><abbr bid="B15">15</abbr><abbr bid="B16">16</abbr></abbrgrp>.</p>
         <p>Wrapper methods can noticeably reduce the number of features and significantly improve classification accuracy <abbrgrp><abbr bid="B17">17</abbr><abbr bid="B18">18</abbr></abbrgrp>. However, wrapper methods have the drawback of high computational load. With better computational efficiency and similar performance to wrapper methods, embedded methods process feature selection simultaneously with a learning classifier. Examples of embedded methods are LASSO <abbrgrp><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr></abbrgrp> and logistic regression with the regularized Laplacian prior <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>.</p>
         <p>Combining the sequential forward selection (SFS) and sequential floating forward selection (SFFS) with LS (Least Squares) Bound measure, Zhou and Mao proposed SFS-LS bound and SFFS-LS bound algorithms for optimal gene selection <abbrgrp><abbr bid="B22">22</abbr></abbrgrp>. Tang <it>et al</it>. also proposed two gene selection methods, leave-one-out calculation sequential forward selection (LOOCSFS) and the gradient based leave-one-out gene selection (GLGS) <abbrgrp><abbr bid="B23">23</abbr></abbrgrp>. Diaz-Uriarte and De Andres <abbrgrp><abbr bid="B24">24</abbr></abbrgrp> presented a new method for gene selection that uses random forest <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. The main advantage of this method is that it returns very small sets of genes that retain high predictive accuracy. The algorithms are available in the R package varSelRF. Additionally, Guyon and Elisseeff elaborated a wide range of aspects in feature selection including a better definition of the objective function, feature construction, feature ranking, multivariate feature selection, efficient search methods and feature validity assessment methods <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>.</p>
         <p>In human genetic research, exploiting information redundancy from highly correlated genes may potentially reduce the cost of classification in terms of time and money. To deal with redundancy issues and to improve classification for microarray data, we designed a gene selection method, recursive feature addition (RFA), in our previous work <abbrgrp><abbr bid="B27">27</abbr></abbrgrp>; however, the optimal feature set associated with the best training was not solved. In this paper, we compare this method to SVMRFE, LOOCSFS, GLGS, SFS-LSbound, SFFS-LSbound and T-test by using six benchmark microarray data sets; meanwhile, we propose an algorithm, Lagging Prediction Peephole Optimization (LPPO), to choose the final optimal feature/gene set. We evaluate LPPO by comparing it with random strategy under the best training condition and varSelRF <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>.</p>
      </sec>
      <sec>
         <st>
            <p>Results</p>
         </st>
         <p>Under feature dimension <it>j</it>, the training accuracy of the <it>i</it><sup>th </sup>experiment is <it>r</it>(<it>i, j</it>), and the testing accuracy of the <it>i</it><sup>th </sup>experiment is <it>s</it>(<it>i, j</it>), <it>i </it>= 1, 2,..., <it>I</it>; <it>j </it>= 1, 2,..., <it>J</it>; where <it>I </it>is the number of experiments and <it>J </it>is the number of chosen features. The average testing accuracy of the experiments under the feature dimension <it>j</it>, <it>s</it>(<it>j</it>), <it>j </it>= 1, 2,..., <it>J</it>, is calculated as follows:</p>
         <p>
            <display-formula id="M1">
               <m:math xmlns:m="http://www.w3.org/1998/Math/MathML" name="1471-2164-12-S5-S1-i1"><m:mrow>
   <m:mi>s</m:mi>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mi>j</m:mi>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
   <m:mo class="MathClass-rel">=</m:mo>
   <m:mfrac>
      <m:mrow>
         <m:mn>1</m:mn>
      </m:mrow>
      <m:mrow>
         <m:mi>I</m:mi>
      </m:mrow>
   </m:mfrac>
   <m:msubsup>
      <m:mrow>
         <m:mo mathsize="big">&#8721;</m:mo>
      </m:mrow>
      <m:mrow>
         <m:mi>i</m:mi>
         <m:mo class="MathClass-rel">=</m:mo>
         <m:mn>1</m:mn>
      </m:mrow>
      <m:mrow>
         <m:mi>I</m:mi>
      </m:mrow>
   </m:msubsup>
   <m:mi>s</m:mi>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mi>i</m:mi>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mi>j</m:mi>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
</m:mrow>
</m:math>
            </display-formula>
         </p>
         <p>The average testing accuracy of the <it>i</it><sup>th </sup>experiment under the condition that the associated/corresponding training accuracy is the highest, <it>ms_hr</it>(<it>i</it>), is defined as follows:</p>
         <p>
            <display-formula id="M2">
               <m:math xmlns:m="http://www.w3.org/1998/Math/MathML" name="1471-2164-12-S5-S1-i2"><m:mrow>
   <m:mi>m</m:mi>
   <m:mi>s</m:mi>
   <m:mstyle class="text">
      <m:mtext>_</m:mtext>
   </m:mstyle>
   <m:mi>h</m:mi>
   <m:mi>r</m:mi>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mi>i</m:mi>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
   <m:mo class="MathClass-rel">=</m:mo>
   <m:mstyle class="text">
      <m:mtext class="textsf" mathvariant="sans-serif">mean</m:mtext>
   </m:mstyle>
   <m:mfenced close=")" open="(" separators="">
      <m:mrow>
         <m:mi>s</m:mi>
         <m:mfenced close=")" open="(" separators="">
            <m:mrow>
               <m:mi>i</m:mi>
               <m:mo class="MathClass-punc">,</m:mo>
               <m:mi>m</m:mi>
            </m:mrow>
         </m:mfenced>
      </m:mrow>
   </m:mfenced>
   <m:mfenced close="" open="|" separators="">
      <m:mrow>
         <m:mi>r</m:mi>
         <m:mfenced close=")" open="(" separators="">
            <m:mrow>
               <m:mi>i</m:mi>
               <m:mo class="MathClass-punc">,</m:mo>
               <m:mi>m</m:mi>
            </m:mrow>
         </m:mfenced>
      </m:mrow>
   </m:mfenced>
   <m:mo class="MathClass-rel">=</m:mo>
   <m:mo class="qopname"> max</m:mo>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mi>r</m:mi>
         <m:mrow>
            <m:mo class="MathClass-open">(</m:mo>
            <m:mrow>
               <m:mi>i</m:mi>
               <m:mo class="MathClass-punc">,</m:mo>
               <m:mi>j</m:mi>
            </m:mrow>
            <m:mo class="MathClass-close">)</m:mo>
         </m:mrow>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
   <m:mo class="MathClass-punc">,</m:mo>
   <m:mo class="MathClass-op">&#8704;</m:mo>
   <m:mi>m</m:mi>
   <m:mo class="MathClass-punc">,</m:mo>
   <m:mi>j</m:mi>
   <m:mo class="MathClass-rel">&#8712;</m:mo>
   <m:mrow>
      <m:mo class="MathClass-open">{</m:mo>
      <m:mrow>
         <m:mn>1</m:mn>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mn>2</m:mn>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mo class="MathClass-punc">&#8230;</m:mo>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mi>J</m:mi>
      </m:mrow>
      <m:mo class="MathClass-close">}</m:mo>
   </m:mrow>
</m:mrow>
</m:math>
            </display-formula>
         </p>
         <p>The average testing accuracy <it>ms_hr</it>(<it>i</it>) is the expected value of the random strategy under the best training classification of the <it>i</it><sup>th </sup>experiment.</p>
         <p>The highest testing accuracy of the <it>i</it><sup>th </sup>experiment under the condition that the associated/corresponding training accuracy is the highest, <it>hs_hr</it>(<it>i</it>), is defined as follows:</p>
         <p>
            <display-formula id="M3">
               <m:math xmlns:m="http://www.w3.org/1998/Math/MathML" name="1471-2164-12-S5-S1-i3"><m:mrow>
   <m:mi>h</m:mi>
   <m:mi>s</m:mi>
   <m:mstyle class="text">
      <m:mtext>_</m:mtext>
   </m:mstyle>
   <m:mi>h</m:mi>
   <m:mi>r</m:mi>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mi>i</m:mi>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
   <m:mo class="MathClass-rel">=</m:mo>
   <m:mstyle class="text">
      <m:mtext class="textsf" mathvariant="sans-serif">max</m:mtext>
   </m:mstyle>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mi>s</m:mi>
         <m:mrow>
            <m:mo class="MathClass-open">(</m:mo>
            <m:mrow>
               <m:mi>i</m:mi>
               <m:mo class="MathClass-punc">,</m:mo>
               <m:mi>m</m:mi>
            </m:mrow>
            <m:mo class="MathClass-close">)</m:mo>
         </m:mrow>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
   <m:mo class="MathClass-rel">|</m:mo>
   <m:mi>r</m:mi>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mi>i</m:mi>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mi>m</m:mi>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
   <m:mo class="MathClass-rel">=</m:mo>
   <m:mo class="qopname"> max</m:mo>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mi>r</m:mi>
         <m:mrow>
            <m:mo class="MathClass-open">(</m:mo>
            <m:mrow>
               <m:mi>i</m:mi>
               <m:mo class="MathClass-punc">,</m:mo>
               <m:mi>j</m:mi>
            </m:mrow>
            <m:mo class="MathClass-close">)</m:mo>
         </m:mrow>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
   <m:mo class="MathClass-punc">,</m:mo>
   <m:mo class="MathClass-op">&#8704;</m:mo>
   <m:mi>m</m:mi>
   <m:mo class="MathClass-punc">,</m:mo>
   <m:mi>j</m:mi>
   <m:mo class="MathClass-rel">&#8712;</m:mo>
   <m:mrow>
      <m:mo class="MathClass-open">{</m:mo>
      <m:mrow>
         <m:mn>1</m:mn>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mn>2</m:mn>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mo class="MathClass-punc">&#8230;</m:mo>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mi>J</m:mi>
      </m:mrow>
      <m:mo class="MathClass-close">}</m:mo>
   </m:mrow>
</m:mrow>
</m:math>
            </display-formula>
         </p>
         <sec>
            <st>
               <p>Average testing accuracy</p>
            </st>
            <p>Figure <figr fid="F1">1</figr> lists the average testing accuracies of the gene selection methods with classifiers NMSC, SVM, NBC, and RF. Again, the performances of NBC-MMC, NMSC-MMC, NBC-MSC, and NMSC-MSC are close to one another; therefore, the average testing accuracies of the gene selection methods NBC-MMC, NMSC-MMC, and NBC-MSC are not listed in the figures. It indicates that the average testing accuracy of NMSC-MSC is the best, followed by GLGS, LOOCSFS, and SVM-RFE. SFS-LS bound, SFFS-LS bound, and T-TEST did not perform well. Figure <figr fid="F1">1</figr> also demonstrates that, spanning several data sets and learning classifiers, the performance and stabilization of the gene selection method of NMSC-MSC is the best.</p>
            <fig id="F1"><title><p>Figure 1</p></title><caption><p>The average testing accuracies of different gene selection methods for six benchmark data sets by using the classifiers (NBC, NMSC, SVM, RF)</p></caption><text>
   <p><b>The average testing accuracies of different gene selection methods for six benchmark data sets by using the classifiers (NBC, NMSC, SVM, RF)</b>. X-axis and y-axis give the feature dimension and testing accuracy values, respectively.</p>
</text><graphic file="1471-2164-12-S5-S1-1"/></fig>
         </sec>
         <sec>
            <st>
               <p>Testing results under the best training</p>
            </st>
            <p>Table <tblr tid="T1">1</tblr> provides the mean values and standard errors of the testing accuracies ms_hr(i), (i = 1, 2,..., 20) and the highest testing accuracies hs_hr(i), (i = 1, 2, ..., 20) under the highest training classification, respectively. After applying each classifier to each data set, the highest mean value of the ten gene selection methods is shaded. In each data set, the highest mean value in the shade is in bold. With the use of the four learning classifiers, under the best training, RFA, GLGS, LOOCSFS, SVMRFE, SFS-LSBOUND, SFFS-LSBOUND, and T-test respectively achieve the highest testing accuracies (HS_HR), 99.9%, 99.6%, 99.3%, 98.0%, 97.4%, 97.3%, and 96.8% for the leukemia data set; 99.5%, 98.6%, 93.0%, 99.2%, 95.1%, 96.1%, and 94.4% for lymphoma; 96.9%, 96.1%, 95.2%, 95.7%, 93.4%, 92.7%, and 94.0% for prostate; 91.1%, 90.5%, 86.8%, 86.8%, 87.1%, 86.0%, and 85.5% for colon; 94.0%, 91.1%, 85.0%, 85.1%, 76.2%, 76.2%, and 77.4% for CNS; and 85.9%, 83.7%, 80.3%, 80.4%, 81.5%, 81.3%, and 77.6% for the breast cancer data set. In applying the ten gene selection methods to the six benchmark data sets, all the highest testing accuracies are obtained from the gene set chosen by RFA.</p>
            <tbl id="T1"><title><p>Table 1</p></title><caption><p>Mean values and standard errors of hs_hr and ms_hr.</p></caption><tblbdy cols="10">
      <r>
         <c ca="center">
            <p>
               <b>DATA SET</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>GENE SELECTION METHOD</b>
            </p>
         </c>
         <c ca="center" cspan="4">
            <p>
               <b>MEAN(HS_HR) &#177; STD(HS_HR), %</b>
            </p>
         </c>
         <c ca="center" cspan="4">
            <p>
               <b>MEAN(MS_HR) &#177; STD(MS_HR), %</b>
            </p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c cspan="8">
            <hr/>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>
               <b>NMSC</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>SVM</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>NBC</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>RF</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>NMSC</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>SVM</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>NBC</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>RF</b>
            </p>
         </c>
      </r>
      <r>
         <c cspan="10">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>Leukemia</p>
         </c>
         <c ca="center">
            <p>NBC-MMC</p>
         </c>
         <c ca="center">
            <p>
               <b>99.9 &#177; 0.6</b>
            </p>
         </c>
         <c ca="center">
            <p>99.4 &#177; 1.2</p>
         </c>
         <c ca="center">
            <p>98.3 &#177; 2.3</p>
         </c>
         <c ca="center">
            <p>98.4 &#177; 1.4</p>
         </c>
         <c ca="center">
            <p>98.1 &#177; 1.4</p>
         </c>
         <c ca="center">
            <p>93.4 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>94.3 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>95.6 &#177; 2.3</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MMC</p>
         </c>
         <c ca="center">
            <p>
               <b>99.9 &#177; 0.6</b>
            </p>
         </c>
         <c ca="center">
            <p>99.1 &#177; 1.3</p>
         </c>
         <c ca="center">
            <p>98.4 &#177; 1.9</p>
         </c>
         <c ca="center">
            <p>98.6 &#177; 1.9</p>
         </c>
         <c ca="center">
            <p>97.9 &#177; 1.2</p>
         </c>
         <c ca="center">
            <p>93.3 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>95.2 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>95.7 &#177; 3.4</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NBC-MSC</p>
         </c>
         <c ca="center">
            <p>99.4 &#177; 1.1</p>
         </c>
         <c ca="center">
            <p>99.1 &#177; 1.3</p>
         </c>
         <c ca="center">
            <p>
               <b>98.9 &#177; 1.4</b>
            </p>
         </c>
         <c ca="center">
            <p>98.4 &#177; 1.7</p>
         </c>
         <c ca="center">
            <p>
               <b>98.5 &#177; 1.6</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>94.9 &#177; 2.7</b>
            </p>
         </c>
         <c ca="center">
            <p>94.6 &#177; 2.7</p>
         </c>
         <c ca="center">
            <p>96.0 &#177; 2.5</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MSC</p>
         </c>
         <c ca="center">
            <p>99.7 &#177; 0.9</p>
         </c>
         <c ca="center">
            <p>
               <b>99.6 &#177; 1.0</b>
            </p>
         </c>
         <c ca="center">
            <p>98.6 &#177; 1.7</p>
         </c>
         <c ca="center">
            <p>98.7 &#177; 1.7</p>
         </c>
         <c ca="center">
            <p>97.7 &#177; 1.4</p>
         </c>
         <c ca="center">
            <p>94.8 &#177; 2.5</p>
         </c>
         <c ca="center">
            <p>94.6 &#177; 3.4</p>
         </c>
         <c ca="center">
            <p>95.7 &#177; 3.1</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>GLGS</p>
         </c>
         <c ca="center">
            <p>99.6 &#177; 1.0</p>
         </c>
         <c ca="center">
            <p>98.9 &#177; 1.7</p>
         </c>
         <c ca="center">
            <p>98.6 &#177; 1.7</p>
         </c>
         <c ca="center">
            <p>98.6 &#177; 1.7</p>
         </c>
         <c ca="center">
            <p>97.8 &#177; 1.7</p>
         </c>
         <c ca="center">
            <p>92.5 &#177; 3.8</p>
         </c>
         <c ca="center">
            <p>
               <b>95.3 &#177; 1.8</b>
            </p>
         </c>
         <c ca="center">
            <p>95.0 &#177; 2.5</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>LOOCSFS</p>
         </c>
         <c ca="center">
            <p>97.1 &#177; 3.3</p>
         </c>
         <c ca="center">
            <p>98.0 &#177; 1.5</p>
         </c>
         <c ca="center">
            <p>97.7 &#177; 1.9</p>
         </c>
         <c ca="center">
            <p>
               <b>99.3 &#177; 1.2</b>
            </p>
         </c>
         <c ca="center">
            <p>93.9 &#177; 3.5</p>
         </c>
         <c ca="center">
            <p>94.8 &#177; 3.1</p>
         </c>
         <c ca="center">
            <p>94.5 &#177; 2.7</p>
         </c>
         <c ca="center">
            <p>
               <b>96.7 &#177; 1.6</b>
            </p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SVMRFE</p>
         </c>
         <c ca="center">
            <p>98.0 &#177; 2.0</p>
         </c>
         <c ca="center">
            <p>95.4 &#177; 3.9</p>
         </c>
         <c ca="center">
            <p>97.3 &#177; 2.1</p>
         </c>
         <c ca="center">
            <p>98.0 &#177; 2.0</p>
         </c>
         <c ca="center">
            <p>95.7 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>92.5 &#177; 5.2</p>
         </c>
         <c ca="center">
            <p>92.5 &#177; 3.0</p>
         </c>
         <c ca="center">
            <p>93.4 &#177; 1.9</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SFFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>97.1 &#177; 2.5</p>
         </c>
         <c ca="center">
            <p>97.4 &#177; 3.8</p>
         </c>
         <c ca="center">
            <p>96.3 &#177; 4.1</p>
         </c>
         <c ca="center">
            <p>97.1 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>93.8 &#177; 4.3</p>
         </c>
         <c ca="center">
            <p>92.9 &#177; 3.8</p>
         </c>
         <c ca="center">
            <p>90.2 &#177; 5.8</p>
         </c>
         <c ca="center">
            <p>92.6 &#177; 4.1</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>97.1 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>97.0 &#177; 3.0</p>
         </c>
         <c ca="center">
            <p>96.4 &#177; 3.6</p>
         </c>
         <c ca="center">
            <p>97.3 &#177; 3.0</p>
         </c>
         <c ca="center">
            <p>94.6 &#177; 3.5</p>
         </c>
         <c ca="center">
            <p>93.6 &#177; 3.8</p>
         </c>
         <c ca="center">
            <p>91.2 &#177; 5.0</p>
         </c>
         <c ca="center">
            <p>93.0 &#177; 5.1</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>T-TEST</p>
         </c>
         <c ca="center">
            <p>94.8 &#177; 3.5</p>
         </c>
         <c ca="center">
            <p>95.4 &#177; 4.5</p>
         </c>
         <c ca="center">
            <p>93.3 &#177; 6.9</p>
         </c>
         <c ca="center">
            <p>96.8 &#177; 2.9</p>
         </c>
         <c ca="center">
            <p>92.2 &#177; 3.9</p>
         </c>
         <c ca="center">
            <p>90.7 &#177; 4.8</p>
         </c>
         <c ca="center">
            <p>90.1 &#177; 6.5</p>
         </c>
         <c ca="center">
            <p>93.5 &#177; 3.6</p>
         </c>
      </r>
      <r>
         <c cspan="10">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>Lymphoma</p>
         </c>
         <c ca="center">
            <p>NBC-MMC</p>
         </c>
         <c ca="center">
            <p>98.1 &#177; 2.6</p>
         </c>
         <c ca="center">
            <p>
               <b>99.0 &#177; 1.3</b>
            </p>
         </c>
         <c ca="center">
            <p>97.3 &#177; 2.6</p>
         </c>
         <c ca="center">
            <p>96.4 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>96.2 &#177; 4.3</p>
         </c>
         <c ca="center">
            <p>93.8 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>91.7 &#177; 3.9</p>
         </c>
         <c ca="center">
            <p>91.6 &#177; 3.7</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MMC</p>
         </c>
         <c ca="center">
            <p>99.2 &#177; 1.2</p>
         </c>
         <c ca="center">
            <p>98.8 &#177; 1.6</p>
         </c>
         <c ca="center">
            <p>97.9 &#177; 2.6</p>
         </c>
         <c ca="center">
            <p>96.5 &#177; 3.7</p>
         </c>
         <c ca="center">
            <p>96.9 &#177; 1.9</p>
         </c>
         <c ca="center">
            <p>93.0 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>93.1 &#177; 3.3</p>
         </c>
         <c ca="center">
            <p>92.3 &#177; 4.0</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NBC-MSC</p>
         </c>
         <c ca="center">
            <p>99.4 &#177; 1.1</p>
         </c>
         <c ca="center">
            <p>98.4 &#177; 1.8</p>
         </c>
         <c ca="center">
            <p>97.9 &#177; 2.6</p>
         </c>
         <c ca="center">
            <p>96.8 &#177; 3.3</p>
         </c>
         <c ca="center">
            <p>
               <b>97.5 &#177; 1.9</b>
            </p>
         </c>
         <c ca="center">
            <p>93.1 &#177; 3.5</p>
         </c>
         <c ca="center">
            <p>92.7 &#177; 3.5</p>
         </c>
         <c ca="center">
            <p>92.6 &#177; 4.1</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MSC</p>
         </c>
         <c ca="center">
            <p>
               <b>99.5 &#177; 1.1</b>
            </p>
         </c>
         <c ca="center">
            <p>98.8 &#177; 1.6</p>
         </c>
         <c ca="center">
            <p>
               <b>98.1 &#177; 2.0</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>97.0 &#177; 3.6</b>
            </p>
         </c>
         <c ca="center">
            <p>97.2 &#177; 1.9</p>
         </c>
         <c ca="center">
            <p>
               <b>93.9 &#177; 3.0</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>93.9 &#177; 3.1</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>93.4 &#177; 3.9</b>
            </p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>GLGS</p>
         </c>
         <c ca="center">
            <p>98.6 &#177; 1.8</p>
         </c>
         <c ca="center">
            <p>98.2 &#177; 1.9</p>
         </c>
         <c ca="center">
            <p>97.0 &#177; 2.6</p>
         </c>
         <c ca="center">
            <p>96.9 &#177; 2.3</p>
         </c>
         <c ca="center">
            <p>96.5 &#177; 2.1</p>
         </c>
         <c ca="center">
            <p>92.5 &#177; 3.8</p>
         </c>
         <c ca="center">
            <p>92.3 &#177; 3.6</p>
         </c>
         <c ca="center">
            <p>91.7 &#177; 2.9</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>LOOCSFS</p>
         </c>
         <c ca="center">
            <p>87.0 &#177; 7.2</p>
         </c>
         <c ca="center">
            <p>93.0 &#177; 5.3</p>
         </c>
         <c ca="center">
            <p>87.3 &#177; 5.1</p>
         </c>
         <c ca="center">
            <p>92.9 &#177; 4.8</p>
         </c>
         <c ca="center">
            <p>85.8 &#177; 6.8</p>
         </c>
         <c ca="center">
            <p>87.8 &#177; 5.4</p>
         </c>
         <c ca="center">
            <p>85.1 &#177; 4.5</p>
         </c>
         <c ca="center">
            <p>88.2 &#177; 4.3</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SVMRFE</p>
         </c>
         <c ca="center">
            <p>99.2 &#177; 1.5</p>
         </c>
         <c ca="center">
            <p>96.5 &#177; 3.9</p>
         </c>
         <c ca="center">
            <p>97.2 &#177; 3.4</p>
         </c>
         <c ca="center">
            <p>96.6 &#177; 3.1</p>
         </c>
         <c ca="center">
            <p>96.5 &#177; 2.0</p>
         </c>
         <c ca="center">
            <p>91.8 &#177; 4.3</p>
         </c>
         <c ca="center">
            <p>93.1 &#177; 4.0</p>
         </c>
         <c ca="center">
            <p>93.3 &#177; 4.0</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SFFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>88.7 &#177; 6.1</p>
         </c>
         <c ca="center">
            <p>95.1 &#177; 3.3</p>
         </c>
         <c ca="center">
            <p>84.0 &#177; 4.9</p>
         </c>
         <c ca="center">
            <p>92.2 &#177; 4.7</p>
         </c>
         <c ca="center">
            <p>87.0 &#177; 5.7</p>
         </c>
         <c ca="center">
            <p>88.2 &#177; 4.9</p>
         </c>
         <c ca="center">
            <p>80.6 &#177; 3.9</p>
         </c>
         <c ca="center">
            <p>86.8 &#177; 4.8</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>87.7 &#177; 6.1</p>
         </c>
         <c ca="center">
            <p>96.1 &#177; 3.5</p>
         </c>
         <c ca="center">
            <p>86.1 &#177; 3.5</p>
         </c>
         <c ca="center">
            <p>91.8 &#177; 4.2</p>
         </c>
         <c ca="center">
            <p>86.4 &#177; 5.6</p>
         </c>
         <c ca="center">
            <p>91.1 &#177; 3.7</p>
         </c>
         <c ca="center">
            <p>82.7 &#177; 3.4</p>
         </c>
         <c ca="center">
            <p>86.1 &#177; 4.8</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>T-TEST</p>
         </c>
         <c ca="center">
            <p>86.0 &#177; 5.7</p>
         </c>
         <c ca="center">
            <p>94.4 &#177; 3.0</p>
         </c>
         <c ca="center">
            <p>86.5 &#177; 7.0</p>
         </c>
         <c ca="center">
            <p>91.7 &#177; 5.2</p>
         </c>
         <c ca="center">
            <p>84.3 &#177; 5.8</p>
         </c>
         <c ca="center">
            <p>87.7 &#177; 3.3</p>
         </c>
         <c ca="center">
            <p>83.9 &#177; 6.1</p>
         </c>
         <c ca="center">
            <p>87.2 &#177; 4.5</p>
         </c>
      </r>
      <r>
         <c cspan="10">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>Prostate</p>
         </c>
         <c ca="center">
            <p>NBC-MMC</p>
         </c>
         <c ca="center">
            <p>96.3 &#177; 2.4</p>
         </c>
         <c ca="center">
            <p>95.8 &#177; 2.5</p>
         </c>
         <c ca="center">
            <p>94.8 &#177; 2.6</p>
         </c>
         <c ca="center">
            <p>
               <b>96.5 &#177; 2.0</b>
            </p>
         </c>
         <c ca="center">
            <p>94.2 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>91.6 &#177; 2.3</p>
         </c>
         <c ca="center">
            <p>90.4 &#177; 2.7</p>
         </c>
         <c ca="center">
            <p>92.1 &#177; 2.2</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MMC</p>
         </c>
         <c ca="center">
            <p>95.6 &#177; 2.3</p>
         </c>
         <c ca="center">
            <p>95.9 &#177; 2.5</p>
         </c>
         <c ca="center">
            <p>93.7 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>95.3 &#177; 2.3</p>
         </c>
         <c ca="center">
            <p>92.7 &#177; 2.3</p>
         </c>
         <c ca="center">
            <p>91.4 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>90.7 &#177; 3.1</p>
         </c>
         <c ca="center">
            <p>91.3 &#177; 2.3</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NBC-MSC</p>
         </c>
         <c ca="center">
            <p>96.4 &#177; 2.0</p>
         </c>
         <c ca="center">
            <p>96.6 &#177; 1.9</p>
         </c>
         <c ca="center">
            <p>
               <b>95.2 &#177; 2.1</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>96.5 &#177; 1.9</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>94.6 &#177; 2.3</b>
            </p>
         </c>
         <c ca="center">
            <p>92.5 &#177; 2.3</p>
         </c>
         <c ca="center">
            <p>91.0 &#177; 2.3</p>
         </c>
         <c ca="center">
            <p>
               <b>92.5 &#177; 2.2</b>
            </p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MSC</p>
         </c>
         <c ca="center">
            <p>
               <b>96.9 &#177; 2.3</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>96.7 &#177; 1.7</b>
            </p>
         </c>
         <c ca="center">
            <p>94.5 &#177; 2.0</p>
         </c>
         <c ca="center">
            <p>95.8 &#177; 1.8</p>
         </c>
         <c ca="center">
            <p>94.5 &#177; 2.4</p>
         </c>
         <c ca="center">
            <p>
               <b>92.8 &#177; 1.9</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>91.8 &#177; 2.5</b>
            </p>
         </c>
         <c ca="center">
            <p>92.0 &#177; 1.9</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>GLGS</p>
         </c>
         <c ca="center">
            <p>93.6 &#177; 3.0</p>
         </c>
         <c ca="center">
            <p>96.1 &#177; 2.2</p>
         </c>
         <c ca="center">
            <p>90.4 &#177; 3.9</p>
         </c>
         <c ca="center">
            <p>94.7 &#177; 2.0</p>
         </c>
         <c ca="center">
            <p>91.5 &#177; 2.7</p>
         </c>
         <c ca="center">
            <p>91.7 &#177; 2.6</p>
         </c>
         <c ca="center">
            <p>87.5 &#177; 3.4</p>
         </c>
         <c ca="center">
            <p>90.0 &#177; 2.5</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>LOOCSFS</p>
         </c>
         <c ca="center">
            <p>88.4 &#177; 5.2</p>
         </c>
         <c ca="center">
            <p>94.9 &#177; 2.9</p>
         </c>
         <c ca="center">
            <p>90.7 &#177; 5.3</p>
         </c>
         <c ca="center">
            <p>95.2 &#177; 2.6</p>
         </c>
         <c ca="center">
            <p>87.0 &#177; 4.7</p>
         </c>
         <c ca="center">
            <p>91.1 &#177; 3.4</p>
         </c>
         <c ca="center">
            <p>88.0 &#177; 4.5</p>
         </c>
         <c ca="center">
            <p>92.3 &#177; 2.3</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SVMRFE</p>
         </c>
         <c ca="center">
            <p>94.1 &#177; 3.4</p>
         </c>
         <c ca="center">
            <p>92.3 &#177; 2.7</p>
         </c>
         <c ca="center">
            <p>92.8 &#177; 4.3</p>
         </c>
         <c ca="center">
            <p>95.7 &#177; 2.6</p>
         </c>
         <c ca="center">
            <p>92.4 &#177; 3.3</p>
         </c>
         <c ca="center">
            <p>86.7 &#177; 3.5</p>
         </c>
         <c ca="center">
            <p>90.0 &#177; 4.0</p>
         </c>
         <c ca="center">
            <p>
               <b>92.5 &#177; 2.8</b>
            </p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SFFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>90.4 &#177; 3.2</p>
         </c>
         <c ca="center">
            <p>93.4 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>86.2 &#177; 5.8</p>
         </c>
         <c ca="center">
            <p>90.2 &#177; 3.2</p>
         </c>
         <c ca="center">
            <p>88.9 &#177; 3.1</p>
         </c>
         <c ca="center">
            <p>86.0 &#177; 3.2</p>
         </c>
         <c ca="center">
            <p>84.4 &#177; 5.1</p>
         </c>
         <c ca="center">
            <p>86.1 &#177; 4.0</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>89.7 &#177; 4.9</p>
         </c>
         <c ca="center">
            <p>92.7 &#177; 4.0</p>
         </c>
         <c ca="center">
            <p>87.3 &#177; 5.4</p>
         </c>
         <c ca="center">
            <p>92.4 &#177; 3.5</p>
         </c>
         <c ca="center">
            <p>88.3 &#177; 5.1</p>
         </c>
         <c ca="center">
            <p>87.2 &#177; 5.0</p>
         </c>
         <c ca="center">
            <p>85.1 &#177; 5.4</p>
         </c>
         <c ca="center">
            <p>89.0 &#177; 3.9</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>T-TEST</p>
         </c>
         <c ca="center">
            <p>91.4 &#177; 4.1</p>
         </c>
         <c ca="center">
            <p>92.5 &#177; 2.1</p>
         </c>
         <c ca="center">
            <p>91.7 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>94.0 &#177; 3.0</p>
         </c>
         <c ca="center">
            <p>89.7 &#177; 3.7</p>
         </c>
         <c ca="center">
            <p>87.1 &#177; 3.2</p>
         </c>
         <c ca="center">
            <p>89.0 &#177; 4.3</p>
         </c>
         <c ca="center">
            <p>91.0 &#177; 3.1</p>
         </c>
      </r>
      <r>
         <c cspan="10">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>Colon</p>
         </c>
         <c ca="center">
            <p>NBC-MMC</p>
         </c>
         <c ca="center">
            <p>88.7 &#177; 5.5</p>
         </c>
         <c ca="center">
            <p>
               <b>87.7 &#177; 5.2</b>
            </p>
         </c>
         <c ca="center">
            <p>86.5 &#177; 4.0</p>
         </c>
         <c ca="center">
            <p>89.7 &#177; 4.9</p>
         </c>
         <c ca="center">
            <p>84.5 &#177; 5.2</p>
         </c>
         <c ca="center">
            <p>80.9 &#177; 6.0</p>
         </c>
         <c ca="center">
            <p>78.2 &#177; 4.9</p>
         </c>
         <c ca="center">
            <p>82.5 &#177; 5.5</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MMC</p>
         </c>
         <c ca="center">
            <p>
               <b>91.1 &#177; 5.0</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>87.7 &#177; 3.9</b>
            </p>
         </c>
         <c ca="center">
            <p>87.4 &#177; 5.3</p>
         </c>
         <c ca="center">
            <p>90.0 &#177; 4.0</p>
         </c>
         <c ca="center">
            <p>84.9 &#177; 7.1</p>
         </c>
         <c ca="center">
            <p>
               <b>81.3 &#177; 5.5</b>
            </p>
         </c>
         <c ca="center">
            <p>80.8 &#177; 5.9</p>
         </c>
         <c ca="center">
            <p>83.3 &#177; 5.4</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NBC-MSC</p>
         </c>
         <c ca="center">
            <p>89.4 &#177; 4.3</p>
         </c>
         <c ca="center">
            <p>86.9 &#177; 4.6</p>
         </c>
         <c ca="center">
            <p>
               <b>88.7 &#177; 6.0</b>
            </p>
         </c>
         <c ca="center">
            <p>90.0 &#177; 4.0</p>
         </c>
         <c ca="center">
            <p>
               <b>86.0 &#177; 5.2</b>
            </p>
         </c>
         <c ca="center">
            <p>80.3 &#177; 5.6</p>
         </c>
         <c ca="center">
            <p>82.1 &#177; 4.8</p>
         </c>
         <c ca="center">
            <p>
               <b>84.4 &#177; 4.7</b>
            </p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MSC</p>
         </c>
         <c ca="center">
            <p>91.0 &#177; 5.3</p>
         </c>
         <c ca="center">
            <p>87.6 &#177; 4.7</p>
         </c>
         <c ca="center">
            <p>88.1 &#177; 3.3</p>
         </c>
         <c ca="center">
            <p>90.0 &#177; 4.4</p>
         </c>
         <c ca="center">
            <p>
               <b>86.0 &#177; 5.4</b>
            </p>
         </c>
         <c ca="center">
            <p>80.9 &#177; 5.5</p>
         </c>
         <c ca="center">
            <p>
               <b>82.6 &#177; 4.0</b>
            </p>
         </c>
         <c ca="center">
            <p>83.9 &#177; 4.5</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>GLGS</p>
         </c>
         <c ca="center">
            <p>87.3 &#177; 6.2</p>
         </c>
         <c ca="center">
            <p>87.3 &#177; 4.6</p>
         </c>
         <c ca="center">
            <p>85.2 &#177; 4.8</p>
         </c>
         <c ca="center">
            <p>
               <b>90.5 &#177; 4.3</b>
            </p>
         </c>
         <c ca="center">
            <p>83.7 &#177; 6.6</p>
         </c>
         <c ca="center">
            <p>81.2 &#177; 5.5</p>
         </c>
         <c ca="center">
            <p>77.6 &#177; 5.8</p>
         </c>
         <c ca="center">
            <p>83.0 &#177; 4.5</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>LOOCSFS</p>
         </c>
         <c ca="center">
            <p>85.0 &#177; 5.3</p>
         </c>
         <c ca="center">
            <p>86.3 &#177; 3.9</p>
         </c>
         <c ca="center">
            <p>81.6 &#177; 5.8</p>
         </c>
         <c ca="center">
            <p>86.8 &#177; 5.3</p>
         </c>
         <c ca="center">
            <p>82.2 &#177; 4.6</p>
         </c>
         <c ca="center">
            <p>79.3 &#177; 5.2</p>
         </c>
         <c ca="center">
            <p>76.7 &#177; 6.9</p>
         </c>
         <c ca="center">
            <p>80.3 &#177; 5.3</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SVMRFE</p>
         </c>
         <c ca="center">
            <p>86.0 &#177; 6.7</p>
         </c>
         <c ca="center">
            <p>86.8 &#177; 4.8</p>
         </c>
         <c ca="center">
            <p>82.1 &#177; 7.4</p>
         </c>
         <c ca="center">
            <p>86.3 &#177; 5.5</p>
         </c>
         <c ca="center">
            <p>81.8 &#177; 7.2</p>
         </c>
         <c ca="center">
            <p>80.7 &#177; 4.7</p>
         </c>
         <c ca="center">
            <p>77.7 &#177; 7.5</p>
         </c>
         <c ca="center">
            <p>80.3 &#177; 6.0</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SFFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>85.0 &#177; 4.8</p>
         </c>
         <c ca="center">
            <p>87.1 &#177; 4.4</p>
         </c>
         <c ca="center">
            <p>72.7 &#177; 7.0</p>
         </c>
         <c ca="center">
            <p>82.6 &#177; 6.0</p>
         </c>
         <c ca="center">
            <p>82.4 &#177; 4.4</p>
         </c>
         <c ca="center">
            <p>76.2 &#177; 6.3</p>
         </c>
         <c ca="center">
            <p>69.5 &#177; 8.3</p>
         </c>
         <c ca="center">
            <p>74.6 &#177; 6.8</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>85.3 &#177; 4.6</p>
         </c>
         <c ca="center">
            <p>85.8 &#177; 5.3</p>
         </c>
         <c ca="center">
            <p>76.8 &#177; 7.1</p>
         </c>
         <c ca="center">
            <p>86.0 &#177; 4.1</p>
         </c>
         <c ca="center">
            <p>83.3 &#177; 4.7</p>
         </c>
         <c ca="center">
            <p>77.7 &#177; 6.4</p>
         </c>
         <c ca="center">
            <p>72.5 &#177; 6.2</p>
         </c>
         <c ca="center">
            <p>77.6 &#177; 4.5</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>T-TEST</p>
         </c>
         <c ca="center">
            <p>77.4 &#177; 10.4</p>
         </c>
         <c ca="center">
            <p>85.5 &#177; 4.0</p>
         </c>
         <c ca="center">
            <p>76.3 &#177; 8.3</p>
         </c>
         <c ca="center">
            <p>81.5 &#177; 7.2</p>
         </c>
         <c ca="center">
            <p>74.9 &#177; 10.8</p>
         </c>
         <c ca="center">
            <p>75.3 &#177; 5.7</p>
         </c>
         <c ca="center">
            <p>72.8 &#177; 8.2</p>
         </c>
         <c ca="center">
            <p>75.1 &#177; 7.8</p>
         </c>
      </r>
      <r>
         <c cspan="10">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>CNS</p>
         </c>
         <c ca="center">
            <p>NBC-MMC</p>
         </c>
         <c ca="center">
            <p>91.8 &#177; 6.1</p>
         </c>
         <c ca="center">
            <p>
               <b>92.9 &#177; 3.6</b>
            </p>
         </c>
         <c ca="center">
            <p>77.8 &#177; 5.2</p>
         </c>
         <c ca="center">
            <p>
               <b>85.7 &#177; 4.0</b>
            </p>
         </c>
         <c ca="center">
            <p>86.7 &#177; 6.0</p>
         </c>
         <c ca="center">
            <p>82.4 &#177; 4.7</p>
         </c>
         <c ca="center">
            <p>67.3 &#177; 4.1</p>
         </c>
         <c ca="center">
            <p>
               <b>76.3 &#177; 4.0</b>
            </p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MMC</p>
         </c>
         <c ca="center">
            <p>90.0 &#177; 6.4</p>
         </c>
         <c ca="center">
            <p>92.2 &#177; 5.7</p>
         </c>
         <c ca="center">
            <p>78.0 &#177; 5.3</p>
         </c>
         <c ca="center">
            <p>82.7 &#177; 5.2</p>
         </c>
         <c ca="center">
            <p>82.8 &#177; 6.8</p>
         </c>
         <c ca="center">
            <p>82.1 &#177; 5.6</p>
         </c>
         <c ca="center">
            <p>67.5 &#177; 5.5</p>
         </c>
         <c ca="center">
            <p>73.5 &#177; 4.9</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NBC-MSC</p>
         </c>
         <c ca="center">
            <p>
               <b>94.0 &#177; 4.6</b>
            </p>
         </c>
         <c ca="center">
            <p>92.0 &#177; 4.4</p>
         </c>
         <c ca="center">
            <p>81.1 &#177; 4.1</p>
         </c>
         <c ca="center">
            <p>85.5 &#177; 4.9</p>
         </c>
         <c ca="center">
            <p>
               <b>88.4 &#177; 5.2</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>82.6 &#177; 5.5</b>
            </p>
         </c>
         <c ca="center">
            <p>70.2 &#177; 3.7</p>
         </c>
         <c ca="center">
            <p>75.9 &#177; 5.3</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MSC</p>
         </c>
         <c ca="center">
            <p>92.8 &#177; 4.0</p>
         </c>
         <c ca="center">
            <p>91.6 &#177; 4.9</p>
         </c>
         <c ca="center">
            <p>
               <b>81.3 &#177; 6.1</b>
            </p>
         </c>
         <c ca="center">
            <p>84.9 &#177; 4.1</p>
         </c>
         <c ca="center">
            <p>85.6 &#177; 4.3</p>
         </c>
         <c ca="center">
            <p>81.4 &#177; 6.2</p>
         </c>
         <c ca="center">
            <p>70.0 &#177; 4.5</p>
         </c>
         <c ca="center">
            <p>74.4 &#177; 4.2</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>GLGS</p>
         </c>
         <c ca="center">
            <p>84.7 &#177; 3.3</p>
         </c>
         <c ca="center">
            <p>91.1 &#177; 5.4</p>
         </c>
         <c ca="center">
            <p>78.8 &#177; 5.5</p>
         </c>
         <c ca="center">
            <p>84.2 &#177; 5.0</p>
         </c>
         <c ca="center">
            <p>82.4 &#177; 3.6</p>
         </c>
         <c ca="center">
            <p>81.3 &#177; 4.8</p>
         </c>
         <c ca="center">
            <p>67.9 &#177; 4.5</p>
         </c>
         <c ca="center">
            <p>75.3 &#177; 4.3</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>LOOCSFS</p>
         </c>
         <c ca="center">
            <p>71.3 &#177; 9.8</p>
         </c>
         <c ca="center">
            <p>85.0 &#177; 5.9</p>
         </c>
         <c ca="center">
            <p>79.1 &#177; 7.7</p>
         </c>
         <c ca="center">
            <p>83.2 &#177; 4.4</p>
         </c>
         <c ca="center">
            <p>69.3 &#177; 8.0</p>
         </c>
         <c ca="center">
            <p>77.6 &#177; 4.5</p>
         </c>
         <c ca="center">
            <p>
               <b>71.8 &#177; 6.2</b>
            </p>
         </c>
         <c ca="center">
            <p>75.3 &#177; 5.1</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SVMRFE</p>
         </c>
         <c ca="center">
            <p>83.2 &#177; 8.9</p>
         </c>
         <c ca="center">
            <p>85.1 &#177; 8.4</p>
         </c>
         <c ca="center">
            <p>77.1 &#177; 6.8</p>
         </c>
         <c ca="center">
            <p>83.5 &#177; 4.3</p>
         </c>
         <c ca="center">
            <p>77.0 &#177; 8.0</p>
         </c>
         <c ca="center">
            <p>75.0 &#177; 8.8</p>
         </c>
         <c ca="center">
            <p>65.7 &#177; 7.2</p>
         </c>
         <c ca="center">
            <p>73.3 &#177; 4.9</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SFFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>68.1 &#177; 6.7</p>
         </c>
         <c ca="center">
            <p>71.9 &#177; 7.1</p>
         </c>
         <c ca="center">
            <p>67.6 &#177; 7.7</p>
         </c>
         <c ca="center">
            <p>76.2 &#177; 4.5</p>
         </c>
         <c ca="center">
            <p>65.3 &#177; 6.3</p>
         </c>
         <c ca="center">
            <p>59.4 &#177; 7.5</p>
         </c>
         <c ca="center">
            <p>61.3 &#177; 6.1</p>
         </c>
         <c ca="center">
            <p>66.9 &#177; 4.8</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>67.8 &#177; 6.2</p>
         </c>
         <c ca="center">
            <p>72.4 &#177; 4.9</p>
         </c>
         <c ca="center">
            <p>69.8 &#177; 8.2</p>
         </c>
         <c ca="center">
            <p>76.2 &#177; 5.0</p>
         </c>
         <c ca="center">
            <p>65.7 &#177; 5.4</p>
         </c>
         <c ca="center">
            <p>60.7 &#177; 5.1</p>
         </c>
         <c ca="center">
            <p>63.7 &#177; 7.2</p>
         </c>
         <c ca="center">
            <p>68.4 &#177; 4.5</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>T-TEST</p>
         </c>
         <c ca="center">
            <p>67.5 &#177; 8.8</p>
         </c>
         <c ca="center">
            <p>77.4 &#177; 6.4</p>
         </c>
         <c ca="center">
            <p>67.0 &#177; 7.1</p>
         </c>
         <c ca="center">
            <p>75.5 &#177; 5.9</p>
         </c>
         <c ca="center">
            <p>63.4 &#177; 7.6</p>
         </c>
         <c ca="center">
            <p>67.3 &#177; 5.8</p>
         </c>
         <c ca="center">
            <p>60.9 &#177; 6.8</p>
         </c>
         <c ca="center">
            <p>67.8 &#177; 4.9</p>
         </c>
      </r>
      <r>
         <c cspan="10">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>Breast</p>
         </c>
         <c ca="center">
            <p>NBC-MMC</p>
         </c>
         <c ca="center">
            <p>82.5 &#177; 6.0</p>
         </c>
         <c ca="center">
            <p>82.9 &#177; 3.5</p>
         </c>
         <c ca="center">
            <p>84.1 &#177; 3.0</p>
         </c>
         <c ca="center">
            <p>84.1 &#177; 3.6</p>
         </c>
         <c ca="center">
            <p>81.3 &#177; 5.7</p>
         </c>
         <c ca="center">
            <p>73.2 &#177; 3.8</p>
         </c>
         <c ca="center">
            <p>78.4 &#177; 3.4</p>
         </c>
         <c ca="center">
            <p>78.4 &#177; 3.8</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MMC</p>
         </c>
         <c ca="center">
            <p>
               <b>83.9 &#177; 4.6</b>
            </p>
         </c>
         <c ca="center">
            <p>82.0 &#177; 3.3</p>
         </c>
         <c ca="center">
            <p>82.4 &#177; 4.3</p>
         </c>
         <c ca="center">
            <p>83.7 &#177; 4.7</p>
         </c>
         <c ca="center">
            <p>80.4 &#177; 4.0</p>
         </c>
         <c ca="center">
            <p>72.0 &#177; 3.8</p>
         </c>
         <c ca="center">
            <p>78.4 &#177; 4.3</p>
         </c>
         <c ca="center">
            <p>77.0 &#177; 4.3</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NBC-MSC</p>
         </c>
         <c ca="center">
            <p>83.4 &#177; 5.8</p>
         </c>
         <c ca="center">
            <p>
               <b>83.5 &#177; 3.8</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>85.8 &#177; 3.1</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>85.9 &#177; 4.7</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>81.5 &#177; 5.3</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>74.9 &#177; 3.3</b>
            </p>
         </c>
         <c ca="center">
            <p>79.1 &#177; 3.0</p>
         </c>
         <c ca="center">
            <p>
               <b>79.4 &#177; 4.1</b>
            </p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MSC</p>
         </c>
         <c ca="center">
            <p>82.8 &#177; 4.4</p>
         </c>
         <c ca="center">
            <p>82.4 &#177; 3.8</p>
         </c>
         <c ca="center">
            <p>84.1 &#177; 4.0</p>
         </c>
         <c ca="center">
            <p>83.9 &#177; 4.0</p>
         </c>
         <c ca="center">
            <p>79.6 &#177; 4.0</p>
         </c>
         <c ca="center">
            <p>73.7 &#177; 3.9</p>
         </c>
         <c ca="center">
            <p>
               <b>79.2 &#177; 3.8</b>
            </p>
         </c>
         <c ca="center">
            <p>77.7 &#177; 4.0</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>GLGS</p>
         </c>
         <c ca="center">
            <p>80.8 &#177; 3.7</p>
         </c>
         <c ca="center">
            <p>79.3 &#177; 4.5</p>
         </c>
         <c ca="center">
            <p>81.4 &#177; 4.1</p>
         </c>
         <c ca="center">
            <p>83.7 &#177; 4.6</p>
         </c>
         <c ca="center">
            <p>79.2 &#177; 3.9</p>
         </c>
         <c ca="center">
            <p>70.7 &#177; 4.6</p>
         </c>
         <c ca="center">
            <p>77.8 &#177; 3.7</p>
         </c>
         <c ca="center">
            <p>77.0 &#177; 4.2</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>LOOCSFS</p>
         </c>
         <c ca="center">
            <p>71.7 &#177; 6.5</p>
         </c>
         <c ca="center">
            <p>77.3 &#177; 5.2</p>
         </c>
         <c ca="center">
            <p>78.0 &#177; 5.8</p>
         </c>
         <c ca="center">
            <p>80.3 &#177; 3.8</p>
         </c>
         <c ca="center">
            <p>70.4 &#177; 6.5</p>
         </c>
         <c ca="center">
            <p>69.2 &#177; 4.7</p>
         </c>
         <c ca="center">
            <p>74.7 &#177; 5.1</p>
         </c>
         <c ca="center">
            <p>74.3 &#177; 4.2</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SVMRFE</p>
         </c>
         <c ca="center">
            <p>74.3 &#177; 7.1</p>
         </c>
         <c ca="center">
            <p>78.3 &#177; 5.2</p>
         </c>
         <c ca="center">
            <p>77.2 &#177; 5.3</p>
         </c>
         <c ca="center">
            <p>80.4 &#177; 4.1</p>
         </c>
         <c ca="center">
            <p>73.2 &#177; 6.6</p>
         </c>
         <c ca="center">
            <p>72.1 &#177; 5.8</p>
         </c>
         <c ca="center">
            <p>73.9 &#177; 4.5</p>
         </c>
         <c ca="center">
            <p>73.9 &#177; 3.7</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SFFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>76.2 &#177; 5.2</p>
         </c>
         <c ca="center">
            <p>78.9 &#177; 2.8</p>
         </c>
         <c ca="center">
            <p>76.9 &#177; 7.3</p>
         </c>
         <c ca="center">
            <p>81.5 &#177; 5.3</p>
         </c>
         <c ca="center">
            <p>75.0 &#177; 5.3</p>
         </c>
         <c ca="center">
            <p>67.8 &#177; 3.3</p>
         </c>
         <c ca="center">
            <p>75.2 &#177; 6.8</p>
         </c>
         <c ca="center">
            <p>75.6 &#177; 4.9</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>SFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>77.5 &#177; 5.6</p>
         </c>
         <c ca="center">
            <p>78.9 &#177; 4.2</p>
         </c>
         <c ca="center">
            <p>79.8 &#177; 5.2</p>
         </c>
         <c ca="center">
            <p>81.3 &#177; 5.2</p>
         </c>
         <c ca="center">
            <p>75.8 &#177; 5.5</p>
         </c>
         <c ca="center">
            <p>68.0 &#177; 4.7</p>
         </c>
         <c ca="center">
            <p>76.9 &#177; 6.3</p>
         </c>
         <c ca="center">
            <p>75.4 &#177; 5.2</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>T-TEST</p>
         </c>
         <c ca="center">
            <p>71.1 &#177; 5.3</p>
         </c>
         <c ca="center">
            <p>77.6 &#177; 5.2</p>
         </c>
         <c ca="center">
            <p>72.6 &#177; 6.3</p>
         </c>
         <c ca="center">
            <p>76.3 &#177; 5.7</p>
         </c>
         <c ca="center">
            <p>69.3 &#177; 5.3</p>
         </c>
         <c ca="center">
            <p>69.9 &#177; 3.6</p>
         </c>
         <c ca="center">
            <p>70.5 &#177; 5.8</p>
         </c>
         <c ca="center">
            <p>71.1 &#177; 5.8</p>
         </c>
      </r>
   </tblbdy><tblfn>
      <p>In each data set, the highest mean value is highlighted in bold</p>
   </tblfn></tbl>
            <p>Table <tblr tid="T2">2</tblr> lists the number of occurrences for each gene selection method that achieved the best testing accuracy. Table <tblr tid="T2">2</tblr> shows that 61 out of 67 highest mean values were obtained by MMC- or MSC-based methods; GLGS, LOOCSFS, and SVMRFE obtained the best value twice, three times, and once, respectively; LSBOUND and T-TEST never achieved the best value. These results indicate that RFA outperforms the other gene selection methods.</p>
            <tbl id="T2"><title><p>Table 2</p></title><caption><p>The number of occurrences of the best testing accuracy in Table 1</p></caption><tblbdy cols="5">
      <r>
         <c ca="center">
            <p>
               <b>Gene</b>
            </p>
            <p>
               <b>Selection</b>
            </p>
         </c>
         <c ca="center" cspan="2">
            <p>
               <b># Best testing accumulated with each classifier     </b>
            </p>
         </c>
         <c ca="center" cspan="2">
            <p>
               <b># Best testing among the four classifiers</b>
            </p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c cspan="4">
            <hr/>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>
               <b>HS_HR</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>MS_HR</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>HS_HR</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>MS_HR</b>
            </p>
         </c>
      </r>
      <r>
         <c cspan="5">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>NBC-MMC</p>
         </c>
         <c ca="center">
            <p>6</p>
         </c>
         <c ca="center">
            <p>1</p>
         </c>
         <c ca="center">
            <p>1</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>NMSC-MMC</p>
         </c>
         <c ca="center">
            <p>4</p>
         </c>
         <c ca="center">
            <p>1</p>
         </c>
         <c ca="center">
            <p>2</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>NBC-MSC</p>
         </c>
         <c ca="center">
            <p>8</p>
         </c>
         <c ca="center">
            <p>12</p>
         </c>
         <c ca="center">
            <p>2</p>
         </c>
         <c ca="center">
            <p>6</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>NMSC-MSC</p>
         </c>
         <c ca="center">
            <p>7</p>
         </c>
         <c ca="center">
            <p>8</p>
         </c>
         <c ca="center">
            <p>2</p>
         </c>
         <c ca="center">
            <p>1</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>GLGS</p>
         </c>
         <c ca="center">
            <p>1</p>
         </c>
         <c ca="center">
            <p>1</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>LOOCSFS</p>
         </c>
         <c ca="center">
            <p>1</p>
         </c>
         <c ca="center">
            <p>2</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>SVMRFE</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
         <c ca="center">
            <p>1</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>SFFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>SFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>T-TEST</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
         <c ca="center">
            <p>0</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>Total</p>
         </c>
         <c ca="center">
            <p>27</p>
         </c>
         <c ca="center">
            <p>26</p>
         </c>
         <c ca="center">
            <p>7</p>
         </c>
         <c ca="center">
            <p>7</p>
         </c>
      </r>
   </tblbdy></tbl>
            <p>In addition, to see whether the new methods are superior to the others, regression models were built based on the average testing accuracy (ms_hr) and the highest testing accuracy (hs_hr), respectively, with data set (six benchmark microarray data sets), gene selection method (four new methods and six other methods), and classifier (four classification methods) as independent variables. After adjusting for the data set effect and the classifier effect, the main effects for the new feature selection methods (NBC-MMC, NMSC-MMC, NBC-MSC, and NMSC-MSC) and the others (GLGS, LOOCSFS, SVMRFE, SFS-LSBOUND, SFFS-LSBOUND, and T-test) are 91.86%, 91.67%, 92.47%, 92.27%, 90.65%, 86.96%, 88.89%, 84.70%, 85.38%, and 83.93% for the highest testing accuracy, and 86.38%, 86.15%, 87.30%, 86.97%, 85.48%, 82.76%, 83.96%, 79.45%, 80.58%, and 79.36% for the average testing accuracy, respectively. Table <tblr tid="T3">3</tblr> gives the p-values for testing the superiority of each new method over the other six methods, which are calculated based on one-tailed t-tests from the output of the regression models. From the p-values, the performances of our new methods are statistically significantly better than those of all other methods (most p-values are &lt;0.0001) except for GLGS. From Table <tblr tid="T3">3</tblr>, the MSC-based methods (NBC-MSC, NMSC-MSC) are significantly better than GLGS based on both the highest testing accuracy and the average testing accuracy at a significance level of 0.05. Although the p-values for NBC-MMC and NMSC-MMC versus GLGS are not small enough, due to the small sample size (only six testing data sets) and therefore lower power, we would expect that the differences will be detected at lower significance levels if more data sets are used. To see whether the four new gene selection methods perform differently, we also test each pair of the four methods and calculate the p-values based on two-tailed t-tests from the output of the regression models. All the p-values are larger than 0.2, indicating no statistically significant difference in performance among the four new methods.</p>
            <tbl id="T3"><title><p>Table 3</p></title><caption><p>P-values from testing superiority of new methods to others</p></caption><tblbdy cols="9">
      <r>
         <c ca="center">
            <p>
               <b>Method</b>
            </p>
         </c>
         <c ca="center" cspan="2">
            <p>
               <b>NBC-MMC</b>
            </p>
         </c>
         <c ca="center" cspan="2">
            <p>
               <b>NMSC-MMC</b>
            </p>
         </c>
         <c ca="center" cspan="2">
            <p>
               <b>NBC-MSC</b>
            </p>
         </c>
         <c ca="center" cspan="2">
            <p>
               <b>NMSC-MSC</b>
            </p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c cspan="8">
            <hr/>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>
               <b>HS_HR</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>MS_HR</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>HS_HR</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>MS_HR</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>HS_HR</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>MS_HR</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>HS_HR</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>MS_HR</b>
            </p>
         </c>
      </r>
      <r>
         <c cspan="9">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>GLGS</p>
         </c>
         <c ca="center">
            <p>0.092</p>
         </c>
         <c ca="center">
            <p>0.15</p>
         </c>
         <c ca="center">
            <p>0.13</p>
         </c>
         <c ca="center">
            <p>0.22</p>
         </c>
         <c ca="center">
            <p>0.023</p>
         </c>
         <c ca="center">
            <p>0.0212</p>
         </c>
         <c ca="center">
            <p>0.038</p>
         </c>
         <c ca="center">
            <p>0.048</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>LOOCSFS</p>
         </c>
         <c ca="center">
            <p>&lt;0.0001</p>
         </c>
         <c ca="center">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="center">
            <p>0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="center">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="center">
            <p>&lt;0.0001</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>SVMRFE</p>
         </c>
         <c ca="center">
            <p>&lt;0.0001</p>
         </c>
         <c ca="center">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="center">
            <p>0.0077</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="center">
            <p>0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="center">
            <p>0.0004</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>SFFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>&lt;0.0001</p>
         </c>
         <c ca="center">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>SFS-LSBOUND</p>
         </c>
         <c ca="center">
            <p>&lt;0.0001</p>
         </c>
         <c ca="center">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>T-TEST</p>
         </c>
         <c ca="center">
            <p>&lt;0.0001</p>
         </c>
         <c ca="center">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
         <c ca="left">
            <p>&lt;0.0001</p>
         </c>
      </r>
   </tblbdy></tbl>
         </sec>
         <sec>
            <st>
               <p>Comparison of LPPO and random strategy</p>
            </st>
            <p>Table <tblr tid="T4">4</tblr> lists the mean values of the differences between the testing values obtained by applying NMSC, SVM, NBC, and RF to LPPO (denoted as S_LPPO) and ms_hr. This table shows that, on average, LPPO is superior to the random strategy under the best training accuracies. In summary, across the six benchmark data sets and in comparison with ms_hr, LPPO improves the testing accuracy by 0.8% for NMSC, 0.7% for SVM, 0.4% for NBC, and 0.9% for RF on average.</p>
            <tbl id="T4"><title><p>Table 4</p></title><caption><p>Comparison of LPPO and Random Strategy</p></caption><tblbdy cols="6">
      <r>
         <c ca="center">
            <p>
               <b>Data</b>
            </p>
            <p>
               <b>Set</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>Gene</b>
            </p>
            <p>
               <b>Selection</b>
            </p>
         </c>
         <c ca="center" cspan="4">
            <p>
               <b>MEAN(S_LPPO - MS_HR), %</b>
            </p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c cspan="4">
            <hr/>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>
               <b>NMSC</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>SVM</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>NBC</b>
            </p>
         </c>
         <c ca="center">
            <p>
               <b>RF</b>
            </p>
         </c>
      </r>
      <r>
         <c cspan="6">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>Leukemia</p>
         </c>
         <c ca="center">
            <p>NBC-MMC</p>
         </c>
         <c ca="center">
            <p>0.8</p>
         </c>
         <c ca="center">
            <p>-0.1</p>
         </c>
         <c ca="center">
            <p>2.3</p>
         </c>
         <c ca="center">
            <p>1.4</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MMC</p>
         </c>
         <c ca="center">
            <p>1.0</p>
         </c>
         <c ca="center">
            <p>0.9</p>
         </c>
         <c ca="center">
            <p>1.8</p>
         </c>
         <c ca="center">
            <p>1.6</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NBC-MSC</p>
         </c>
         <c ca="center">
            <p>-0.2</p>
         </c>
         <c ca="center">
            <p>0.3</p>
         </c>
         <c ca="center">
            <p>1.9</p>
         </c>
         <c ca="center">
            <p>1.1</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MSC</p>
         </c>
         <c ca="center">
            <p>1.6</p>
         </c>
         <c ca="center">
            <p>0.7</p>
         </c>
         <c ca="center">
            <p>2.5</p>
         </c>
         <c ca="center">
            <p>1.3</p>
         </c>
      </r>
      <r>
         <c cspan="6">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>Lymphoma</p>
         </c>
         <c ca="center">
            <p>NBC-MMC</p>
         </c>
         <c ca="center">
            <p>0.6</p>
         </c>
         <c ca="center">
            <p>0.1</p>
         </c>
         <c ca="center">
            <p>-1.0</p>
         </c>
         <c ca="center">
            <p>0.4</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MMC</p>
         </c>
         <c ca="center">
            <p>1.3</p>
         </c>
         <c ca="center">
            <p>-0.4</p>
         </c>
         <c ca="center">
            <p>1.4</p>
         </c>
         <c ca="center">
            <p>1.2</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NBC-MSC</p>
         </c>
         <c ca="center">
            <p>0.4</p>
         </c>
         <c ca="center">
            <p>1.2</p>
         </c>
         <c ca="center">
            <p>1.5</p>
         </c>
         <c ca="center">
            <p>1.4</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MSC</p>
         </c>
         <c ca="center">
            <p>0.9</p>
         </c>
         <c ca="center">
            <p>0.1</p>
         </c>
         <c ca="center">
            <p>1.6</p>
         </c>
         <c ca="center">
            <p>0.6</p>
         </c>
      </r>
      <r>
         <c cspan="6">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>Prostate</p>
         </c>
         <c ca="center">
            <p>NBC-MMC</p>
         </c>
         <c ca="center">
            <p>0.2</p>
         </c>
         <c ca="center">
            <p>0.1</p>
         </c>
         <c ca="center">
            <p>0.0</p>
         </c>
         <c ca="center">
            <p>0.5</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MMC</p>
         </c>
         <c ca="center">
            <p>0.9</p>
         </c>
         <c ca="center">
            <p>0.4</p>
         </c>
         <c ca="center">
            <p>0.9</p>
         </c>
         <c ca="center">
            <p>1.1</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NBC-MSC</p>
         </c>
         <c ca="center">
            <p>0.3</p>
         </c>
         <c ca="center">
            <p>0.7</p>
         </c>
         <c ca="center">
            <p>0.6</p>
         </c>
         <c ca="center">
            <p>1.8</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MSC</p>
         </c>
         <c ca="center">
            <p>0.4</p>
         </c>
         <c ca="center">
            <p>0.8</p>
         </c>
         <c ca="center">
            <p>0.2</p>
         </c>
         <c ca="center">
            <p>1.0</p>
         </c>
      </r>
      <r>
         <c cspan="6">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>Colon</p>
         </c>
         <c ca="center">
            <p>NBC-MMC</p>
         </c>
         <c ca="center">
            <p>0.3</p>
         </c>
         <c ca="center">
            <p>0.2</p>
         </c>
         <c ca="center">
            <p>-1.1</p>
         </c>
         <c ca="center">
            <p>0.4</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MMC</p>
         </c>
         <c ca="center">
            <p>0.6</p>
         </c>
         <c ca="center">
            <p>0.0</p>
         </c>
         <c ca="center">
            <p>0.1</p>
         </c>
         <c ca="center">
            <p>0.3</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NBC-MSC</p>
         </c>
         <c ca="center">
            <p>-0.2</p>
         </c>
         <c ca="center">
            <p>-0.5</p>
         </c>
         <c ca="center">
            <p>-2.6</p>
         </c>
         <c ca="center">
            <p>-1.3</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MSC</p>
         </c>
         <c ca="center">
            <p>0.9</p>
         </c>
         <c ca="center">
            <p>0.3</p>
         </c>
         <c ca="center">
            <p>-2.2</p>
         </c>
         <c ca="center">
            <p>-0.5</p>
         </c>
      </r>
      <r>
         <c cspan="6">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>CNS</p>
         </c>
         <c ca="center">
            <p>NBC-MMC</p>
         </c>
         <c ca="center">
            <p>2.1</p>
         </c>
         <c ca="center">
            <p>1.8</p>
         </c>
         <c ca="center">
            <p>2.2</p>
         </c>
         <c ca="center">
            <p>3.1</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MMC</p>
         </c>
         <c ca="center">
            <p>0.8</p>
         </c>
         <c ca="center">
            <p>1.0</p>
         </c>
         <c ca="center">
            <p>0.4</p>
         </c>
         <c ca="center">
            <p>1.6</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NBC-MSC</p>
         </c>
         <c ca="center">
            <p>1.2</p>
         </c>
         <c ca="center">
            <p>0.0</p>
         </c>
         <c ca="center">
            <p>0.6</p>
         </c>
         <c ca="center">
            <p>0.6</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MSC</p>
         </c>
         <c ca="center">
            <p>1.9</p>
         </c>
         <c ca="center">
            <p>2.2</p>
         </c>
         <c ca="center">
            <p>2.4</p>
         </c>
         <c ca="center">
            <p>1.3</p>
         </c>
      </r>
      <r>
         <c cspan="6">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center">
            <p>Breast</p>
            <p>Cancer</p>
         </c>
         <c ca="center">
            <p>NBC-MMC</p>
         </c>
         <c ca="center">
            <p>0.2</p>
         </c>
         <c ca="center">
            <p>1.3</p>
         </c>
         <c ca="center">
            <p>0.5</p>
         </c>
         <c ca="center">
            <p>1.5</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MMC</p>
         </c>
         <c ca="center">
            <p>0.6</p>
         </c>
         <c ca="center">
            <p>3.2</p>
         </c>
         <c ca="center">
            <p>-1.2</p>
         </c>
         <c ca="center">
            <p>0.9</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NBC-MSC</p>
         </c>
         <c ca="center">
            <p>0.0</p>
         </c>
         <c ca="center">
            <p>1.7</p>
         </c>
         <c ca="center">
            <p>-1.6</p>
         </c>
         <c ca="center">
            <p>-0.6</p>
         </c>
      </r>
      <r>
         <c>
            <p/>
         </c>
         <c ca="center">
            <p>NMSC-MSC</p>
         </c>
         <c ca="center">
            <p>1.7</p>
         </c>
         <c ca="center">
            <p>1.3</p>
         </c>
         <c ca="center">
            <p>-1.1</p>
         </c>
         <c ca="center">
            <p>1.0</p>
         </c>
      </r>
      <r>
         <c cspan="6">
            <hr/>
         </c>
      </r>
      <r>
         <c ca="center" cspan="2">
            <p>Average</p>
         </c>
         <c ca="center">
            <p>0.8</p>
         </c>
         <c ca="center">
            <p>0.7</p>
         </c>
         <c ca="center">
            <p>0.4</p>
         </c>
         <c ca="center">
            <p>0.9</p>
         </c>
      </r>
   </tblbdy></tbl>
         </sec>
         <sec>
            <st>
               <p>Comparison of LPPO and varSelRF</p>
            </st>
            <p>Figure <figr fid="F2">2</figr> gives the boxplots of the testing values with the use of learning classifier random forest for the feature sets from LPPO with RFA and varSelRF. The gene selection methods are NBC-MMC, NMSC-MMC, NBC-MSC, NMSC-MSC, and varSelRF from left to right in each subfigure. Figure <figr fid="F2">2</figr> indicates that the testing accuracies by applying random forest to the feature sets of LPPO with RFA are better than those of varSelRF. In comparison with varSelRF, LPPO with RFA increases the average testing accuracy by about 5% for the leukemia data set, 9% for lymphoma, 3% for colon and prostate, 10% for CNS, and 14% for the breast cancer data set.</p>
            <fig id="F2"><title><p>Figure 2</p></title><caption><p>Boxplots of testing accuracies of the LPPO with four gene selection methods using two different classifiers (NBC, NMSC) compared to varSelRF for six data sets</p></caption><text>
   <p><b>Boxplots of testing accuracies of the LPPO with four gene selection methods using two different classifiers (NBC, NMSC) compared to varSelRF for six data sets</b>. RF is the final classifier. All six data sets demonstrate that varSelRF accuracies are lower than our proposed feature selection and optimization algorithm with the same RF classifier.</p>
</text><graphic file="1471-2164-12-S5-S1-2"/></fig>
         </sec>
         <sec>
            <st>
               <p>Computational efficiency</p>
            </st>
            <p>In microarray data analysis, generally, the number of features in the final feature set is far smaller than the total number of variables. Suppose the total number of variables is <it>n </it>and the number of features in the final feature set is <it>m </it>(<it>m </it>&lt;&lt;<it>n</it>). In forward feature selection, with the use of some learning classifier, the computational time is <it>F</it>(<it>s</it>, <it>d</it>) for an <it>s</it>&#215;<it>d </it>feature matrix, where <it>s </it>is the number of data samples (<it>s </it>&lt;&lt; <it>n</it>) and <it>d </it>is the feature dimensionality of each sample. Without loss of generality, if <it>d</it><sub>1</sub>&lt;<it>d</it><sub>2</sub>, then <it>F</it>(<it>s</it>, <it>d</it><sub>1</sub>) &lt;<it>F</it>(<it>s</it>, <it>d</it><sub>2</sub>). The computational cost of our feature selection algorithm is analyzed as follows.</p>
            <p>Let T<sub>1 </sub>denote the total computational time for supervised learning</p>
            <p>
               <display-formula id="M4">
                  <m:math xmlns:m="http://www.w3.org/1998/Math/MathML" name="1471-2164-12-S5-S1-i4"><m:mrow>
   <m:mtable class="aligned">
      <m:mtr>
         <m:mtd columnalign="right">
            <m:msub>
               <m:mrow>
                  <m:mi>T</m:mi>
               </m:mrow>
               <m:mrow>
                  <m:mn>1</m:mn>
               </m:mrow>
            </m:msub>
         </m:mtd>
         <m:mtd columnalign="left">
            <m:mo class="MathClass-rel">=</m:mo>
            <m:mstyle class="text">
               <m:mtext class="textsf" mathvariant="sans-serif">&#160;</m:mtext>
            </m:mstyle>
            <m:mi>n</m:mi>
            <m:mo class="MathClass-bin">*</m:mo>
            <m:mi>F</m:mi>
            <m:mfenced close=")" open="(" separators="">
               <m:mrow>
                  <m:mi>s</m:mi>
                  <m:mo class="MathClass-punc">,</m:mo>
                  <m:mn>1</m:mn>
               </m:mrow>
            </m:mfenced>
            <m:mstyle class="text">
               <m:mtext class="textsf" mathvariant="sans-serif">&#160;</m:mtext>
            </m:mstyle>
            <m:mo class="MathClass-bin">+</m:mo>
            <m:mfenced close=")" open="(" separators="">
               <m:mrow>
                  <m:mi>n</m:mi>
                  <m:mo class="MathClass-bin">-</m:mo>
                  <m:mn>1</m:mn>
               </m:mrow>
            </m:mfenced>
            <m:mo class="MathClass-bin">*</m:mo>
            <m:mi>F</m:mi>
            <m:mfenced close=")" open="(" separators="">
               <m:mrow>
                  <m:mi>s</m:mi>
                  <m:mo class="MathClass-punc">,</m:mo>
                  <m:mn>2</m:mn>
               </m:mrow>
            </m:mfenced>
            <m:mstyle class="text">
               <m:mtext class="textsf" mathvariant="sans-serif">&#160;</m:mtext>
            </m:mstyle>
            <m:mo class="MathClass-bin">+</m:mo>
            <m:mstyle class="text">
               <m:mtext class="textsf" mathvariant="sans-serif">&#160;</m:mtext>
            </m:mstyle>
            <m:mo class="MathClass-op">&#8230;</m:mo>
            <m:mstyle class="text">
               <m:mtext class="textsf" mathvariant="sans-serif">&#160;</m:mtext>
            </m:mstyle>
            <m:mo class="MathClass-bin">+</m:mo>
            <m:mstyle class="text">
               <m:mtext class="textsf" mathvariant="sans-serif">&#160;</m:mtext>
            </m:mstyle>
            <m:mfenced close=")" open="(" separators="">
               <m:mrow>
                  <m:mi>n</m:mi>
                  <m:mo class="MathClass-bin">-</m:mo>
                  <m:mi>m</m:mi>
                  <m:mo class="MathClass-bin">+</m:mo>
                  <m:mn>1</m:mn>
               </m:mrow>
            </m:mfenced>
            <m:mo class="MathClass-bin">*</m:mo>
            <m:mi>F</m:mi>
            <m:mfenced close=")" open="(" separators="">
               <m:mrow>
                  <m:mi>s</m:mi>
                  <m:mo class="MathClass-punc">,</m:mo>
                  <m:mi>m</m:mi>
               </m:mrow>
            </m:mfenced>
         </m:mtd>
         <m:mtd columnalign="right"/>
      </m:mtr>
      <m:mtr>
         <m:mtd columnalign="right">
            <m:mo class="MathClass-rel">&#8804;</m:mo>
            <m:mfenced close="]" open="[" separators="">
               <m:mrow>
                  <m:mi>n</m:mi>
                  <m:mo class="MathClass-bin">+</m:mo>
                  <m:mrow>
                     <m:mo class="MathClass-open">(</m:mo>
                     <m:mrow>
                        <m:mi>n</m:mi>
                        <m:mo class="MathClass-bin">-</m:mo>
                        <m:mn>1</m:mn>
                     </m:mrow>
                     <m:mo class="MathClass-close">)</m:mo>
                  </m:mrow>
                  <m:mo class="MathClass-bin">+</m:mo>
                  <m:mo class="MathClass-punc">.</m:mo>
                  <m:mo class="MathClass-punc">.</m:mo>
                  <m:mo class="MathClass-punc">.</m:mo>
                  <m:mo class="MathClass-bin">+</m:mo>
                  <m:mrow>
                     <m:mo class="MathClass-open">(</m:mo>
                     <m:mrow>
                        <m:mi>n</m:mi>
                        <m:mo class="MathClass-bin">-</m:mo>
                        <m:mi>m</m:mi>
                        <m:mo class="MathClass-bin">+</m:mo>
                        <m:mn>1</m:mn>
                     </m:mrow>
                     <m:mo class="MathClass-close">)</m:mo>
                  </m:mrow>
               </m:mrow>
            </m:mfenced>
            <m:mo class="MathClass-bin">*</m:mo>
            <m:mi>F</m:mi>
            <m:mrow>
               <m:mo class="MathClass-open">(</m:mo>
               <m:mrow>
                  <m:mi>s</m:mi>
                  <m:mo class="MathClass-punc">,</m:mo>
                  <m:mi>m</m:mi>
               </m:mrow>
               <m:mo class="MathClass-close">)</m:mo>
            </m:mrow>
         </m:mtd>
         <m:mtd columnalign="left"/>
      </m:mtr>
      <m:mtr>
         <m:mtd columnalign="right">
            <m:mo class="MathClass-rel">=</m:mo>
            <m:mfrac>
               <m:mrow>
                  <m:mi>m</m:mi>
                  <m:mo class="MathClass-bin">*</m:mo>
                  <m:mrow>
                     <m:mo class="MathClass-open">(</m:mo>
                     <m:mrow>
                        <m:mn>2</m:mn>
                        <m:mo class="MathClass-bin">*</m:mo>
                        <m:mi>n</m:mi>
                        <m:mo class="MathClass-bin">-</m:mo>
                        <m:mi>m</m:mi>
                        <m:mo class="MathClass-bin">+</m:mo>
                        <m:mn>1</m:mn>
                     </m:mrow>
                     <m:mo class="MathClass-close">)</m:mo>
                  </m:mrow>
               </m:mrow>
               <m:mrow>
                  <m:mn>2</m:mn>
               </m:mrow>
            </m:mfrac>
            <m:mo class="MathClass-bin">*</m:mo>
            <m:mi>F</m:mi>
            <m:mrow>
               <m:mo class="MathClass-open">(</m:mo>
               <m:mrow>
                  <m:mi>s</m:mi>
                  <m:mo class="MathClass-punc">,</m:mo>
                  <m:mi>m</m:mi>
               </m:mrow>
               <m:mo class="MathClass-close">)</m:mo>
            </m:mrow>
         </m:mtd>
         <m:mtd columnalign="left"/>
      </m:mtr>
      <m:mtr>
         <m:mtd columnalign="right"/>
      </m:mtr>
   </m:mtable>
</m:mrow>
</m:math>
               </display-formula>
            </p>
            <p>Let T<sub>2 </sub>denote the computational time for similarity calculation among the candidates and chosen genes. If the calculation time between two single-variant vectors with s samples is C(s), then</p>
            <p>
               <display-formula id="M5">
                  <m:math xmlns:m="http://www.w3.org/1998/Math/MathML" name="1471-2164-12-S5-S1-i5"><m:mrow>
   <m:mtable class="aligned">
      <m:mtr>
         <m:mtd columnalign="right">
            <m:msub>
               <m:mrow>
                  <m:mi>T</m:mi>
               </m:mrow>
               <m:mrow>
                  <m:mn>2</m:mn>
               </m:mrow>
            </m:msub>
         </m:mtd>
         <m:mtd columnalign="left">
            <m:mo class="MathClass-rel">&#8804;</m:mo>
            <m:mrow>
               <m:mo class="MathClass-open">(</m:mo>
               <m:mrow>
                  <m:mi>n</m:mi>
                  <m:mo class="MathClass-bin">-</m:mo>
                  <m:mn>1</m:mn>
               </m:mrow>
               <m:mo class="MathClass-close">)</m:mo>
            </m:mrow>
            <m:mo class="MathClass-bin">*</m:mo>
            <m:mi>C</m:mi>
            <m:mrow>
               <m:mo class="MathClass-open">(</m:mo>
               <m:mrow>
                  <m:mi>s</m:mi>
               </m:mrow>
               <m:mo class="MathClass-close">)</m:mo>
            </m:mrow>
            <m:mo class="MathClass-bin">+</m:mo>
            <m:mn>2</m:mn>
            <m:mo class="MathClass-bin">*</m:mo>
            <m:mrow>
               <m:mo class="MathClass-open">(</m:mo>
               <m:mrow>
                  <m:mi>n</m:mi>
                  <m:mo class="MathClass-bin">-</m:mo>
                  <m:mn>2</m:mn>
               </m:mrow>
               <m:mo class="MathClass-close">)</m:mo>
            </m:mrow>
            <m:mo class="MathClass-bin">*</m:mo>
            <m:mi>C</m:mi>
            <m:mrow>
               <m:mo class="MathClass-open">(</m:mo>
               <m:mrow>
                  <m:mi>s</m:mi>
               </m:mrow>
               <m:mo class="MathClass-close">)</m:mo>
            </m:mrow>
            <m:mo class="MathClass-bin">+</m:mo>
            <m:mo class="MathClass-punc">.</m:mo>
            <m:mo class="MathClass-punc">.</m:mo>
            <m:mo class="MathClass-punc">.</m:mo>
            <m:mo class="MathClass-bin">+</m:mo>
            <m:mi>m</m:mi>
            <m:mo class="MathClass-bin">*</m:mo>
            <m:mrow>
               <m:mo class="MathClass-open">(</m:mo>
               <m:mrow>
                  <m:mi>n</m:mi>
                  <m:mo class="MathClass-bin">-</m:mo>
                  <m:mi>m</m:mi>
               </m:mrow>
               <m:mo class="MathClass-close">)</m:mo>
            </m:mrow>
            <m:mo class="MathClass-bin">*</m:mo>
            <m:mi>C</m:mi>
            <m:mrow>
               <m:mo class="MathClass-open">(</m:mo>
               <m:mrow>
                  <m:mi>s</m:mi>
               </m:mrow>
               <m:mo class="MathClass-close">)</m:mo>
            </m:mrow>
         </m:mtd>
         <m:mtd columnalign="right"/>
      </m:mtr>
      <m:mtr>
         <m:mtd columnalign="right">
            <m:mo class="MathClass-rel">=</m:mo>
            <m:mi>C</m:mi>
            <m:mrow>
               <m:mo class="MathClass-open">(</m:mo>
               <m:mrow>
                  <m:mi>s</m:mi>
               </m:mrow>
               <m:mo class="MathClass-close">)</m:mo>
            </m:mrow>
            <m:mo class="MathClass-bin">*</m:mo>
            <m:mfenced close="}" open="{" separators="">
               <m:mrow>
                  <m:mfrac>
                     <m:mrow>
                        <m:mn>1</m:mn>
                     </m:mrow>
                     <m:mrow>
                        <m:mn>2</m:mn>
                     </m:mrow>
                  </m:mfrac>
                  <m:mi>n</m:mi>
                  <m:mi>m</m:mi>
                  <m:mrow>
                     <m:mo class="MathClass-open">(</m:mo>
                     <m:mrow>
                        <m:mi>m</m:mi>
                        <m:mo class="MathClass-bin">+</m:mo>
                        <m:mn>1</m:mn>
                     </m:mrow>
                     <m:mo class="MathClass-close">)</m:mo>
                  </m:mrow>
                  <m:mo class="MathClass-bin">-</m:mo>
                  <m:munderover accent="false" accentunder="false">
                     <m:mrow>
                        <m:mo mathsize="big">&#8721;</m:mo>
                     </m:mrow>
                     <m:mrow>
                        <m:mi>i</m:mi>
                        <m:mo class="MathClass-rel">=</m:mo>
                        <m:mn>1</m:mn>
                     </m:mrow>
                     <m:mrow>
                        <m:mi>m</m:mi>
                     </m:mrow>
                  </m:munderover>
                  <m:msup>
                     <m:mrow>
                        <m:mi>i</m:mi>
                     </m:mrow>
                     <m:mrow>
                        <m:mn>2</m:mn>
                     </m:mrow>
                  </m:msup>
               </m:mrow>
            </m:mfenced>
         </m:mtd>
         <m:mtd columnalign="left"/>
      </m:mtr>
      <m:mtr>
         <m:mtd columnalign="right"/>
      </m:mtr>
   </m:mtable>
</m:mrow>
</m:math>
               </display-formula>
            </p>
            <p>Because m &lt;&lt; n and s &lt;&lt; n for microarray data, the computational cost of our feature selection is given by</p>
            <p>
               <display-formula id="M6">
                  <m:math xmlns:m="http://www.w3.org/1998/Math/MathML" name="1471-2164-12-S5-S1-i6"><m:mrow>
   <m:mi>T</m:mi>
   <m:mo class="MathClass-rel">=</m:mo>
   <m:msub>
      <m:mrow>
         <m:mi>T</m:mi>
      </m:mrow>
      <m:mrow>
         <m:mn>1</m:mn>
      </m:mrow>
   </m:msub>
   <m:mo class="MathClass-bin">+</m:mo>
   <m:msub>
      <m:mrow>
         <m:mi>T</m:mi>
      </m:mrow>
      <m:mrow>
         <m:mn>2</m:mn>
      </m:mrow>
   </m:msub>
   <m:mo class="MathClass-rel">~</m:mo>
   <m:mi>O</m:mi>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mi>n</m:mi>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
</m:mrow>
</m:math>
               </display-formula>
            </p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusions</p>
         </st>
         <p>Our study shows that our gene selection method Recursive Feature Addition (RFA) obtained the best classification performance in the comparison. RFA utilizes supervised learning to obtain the best classification, and identifies the subsequent gene recursively based on the similarity measures between the chosen gene set and the candidates to minimize the redundancy of the genes within the selected subset; hence it obtains more informative and differentially expressed genes. Based on RFA, we also propose an algorithm, Lagging Prediction Peephole Optimization (LPPO), to determine the optimal feature set. Using six popular benchmark data sets, we compared RFA with other gene selection methods. Our studies showed that RFA outperformed other methods with the use of the four popular classifiers: NMSC, NBC, SVM, and random forest. Results also showed that, on average, LPPO is superior to a random strategy under the best training and that it outperformed the random forest based gene selection method varSelRF.</p>
      </sec>
      <sec>
         <st>
            <p>Methods</p>
         </st>
         <sec>
            <st>
               <p>Supervised recursive learning</p>
            </st>
            <p>Our method of RFA uses supervised learning to achieve the highest level of training accuracy and statistical similarity measures to choose the next variable with the least dependence on or correlation to the already identified variables as follows:</p>
            <p>1. Insignificant genes are removed according to their statistical insignificance. Specifically, a gene with a high p-value is usually not differentially expressed and therefore has little contribution in distinguishing normal tissues from tumor tissues or in classifying different types of tissues. To reduce the computational load, those genes should be removed. The filtered gene data is then normalized. Here we use the standard normalization method, MANORM, which is available from MATLAB bioinformatics toolbox.</p>
            <p>2. Each individual gene is selected by supervised learning. A gene with highest classification accuracy is chosen as the most important feature and the first element of the feature set. If multiple genes achieve the same highest classification accuracy, the one with the lowest <it>p</it>-value measured by test-statistics (e.g., score test), is the target of the first element. At this point the chosen feature set, <b>G</b><sub>1</sub>, contains just one element, <it>g</it><sub>1</sub>, corresponding to the feature dimension one.</p>
            <p>3. The (<it>N</it>+1)<sup>st </sup>dimension feature set, <b>G</b><sub><it>N</it>+1 </sub>= {<it>g</it><sub>1, </sub><it>g</it><sub>2</sub>, ..., <it>g<sub>N</sub></it>, <it>g</it><sub><it>N</it>+1</sub>} is obtained by adding <it>g</it><sub><it>N</it>+1 </sub>to the <it>N</it><sup><it>th </it></sup>dimension feature set, <b>G</b><sub><it>N </it></sub>= {<it>g</it><sub>1, </sub><it>g</it><sub>2</sub>, ..., <it>g<sub>N</sub></it>}. The choice of <it>g</it><sub><it>N</it>+1 </sub>is described as follows:</p>
            <p>Add each gene <it>g<sub>i </sub></it>(<it>g<sub>i </sub></it>&#8713; <b>G</b><it><sub>N</sub></it>) into <b>G</b><it><sub>N </sub></it>and obtain the classification accuracy of the feature set <b>G</b><it><sub>N </sub></it>&#8746;{<it>g<sub>i</sub></it>}. The <it>g<sub>i </sub></it>(<it>g<sub>i </sub></it>&#8713; <b>G</b><it><sub>N</sub></it>) associated with the group, <b>G</b><it><sub>N </sub></it>&#8746;{<it>g<sub>i</sub></it>} that obtains the highest classification accuracy, is the candidate for <it>g</it><sub><it>N</it>+1 </sub>(not yet <it>g</it><sub><it>N</it>+1</sub>). Considering the large number of variables, it is highly possible that multiple features correspond to the same highest classification accuracy. These multiple candidates are placed into the set <b>C</b>, but only one candidate from <b>C </b>will be identified as <it>g</it><sub><it>N+1</it></sub>. How to make the selection is described next.</p>
         </sec>
         <sec>
            <st>
               <p>Candidate feature addition</p>
            </st>
            <p>To find the most informative (or least redundant) next feature <it>g</it><sub><it>N</it>+1</sub>, two formulas may be designed by measuring the statistical similarity between the chosen feature set and each candidate. Here we use, say, Pearson's correlation coefficient <abbrgrp><abbr bid="B28">28</abbr></abbrgrp> between chosen features <it>g<sub>n </sub></it>(<it>g<sub>n </sub></it>&#8712; <b>G</b><it><sub>N </sub>, n = </it>1, 2, <it>..</it>., <it>N</it>) and candidate <it>g<sub>c </sub></it>(<it>g<sub>c </sub></it>&#8712; <b>C</b>) to measure the similarity.</p>
            <p>In the first formula, the sum of the square of the correlation, SC, is calculated to measure the similarity and is defined as follows:</p>
            <p>
               <display-formula id="M7">
                  <m:math xmlns:m="http://www.w3.org/1998/Math/MathML" name="1471-2164-12-S5-S1-i7"><m:mrow>
   <m:mstyle class="text">
      <m:mtext class="textsf" mathvariant="sans-serif">SC</m:mtext>
   </m:mstyle>
   <m:mfenced close=")" open="(" separators="">
      <m:mrow>
         <m:msub>
            <m:mrow>
               <m:mi>g</m:mi>
            </m:mrow>
            <m:mrow>
               <m:mi>c</m:mi>
            </m:mrow>
         </m:msub>
      </m:mrow>
   </m:mfenced>
   <m:mo class="MathClass-rel">=</m:mo>
   <m:munderover accent="false" accentunder="false">
      <m:mrow>
         <m:mo mathsize="big"> &#8721;</m:mo>
      </m:mrow>
      <m:mrow>
         <m:mi>n</m:mi>
         <m:mo class="MathClass-rel">=</m:mo>
         <m:mn>1</m:mn>
      </m:mrow>
      <m:mrow>
         <m:mi>N</m:mi>
      </m:mrow>
   </m:munderover>
   <m:mstyle class="text">
      <m:mtext class="textsf" mathvariant="sans-serif">co</m:mtext>
   </m:mstyle>
   <m:msup>
      <m:mrow>
         <m:mstyle class="text">
            <m:mtext class="textsf" mathvariant="sans-serif">r</m:mtext>
         </m:mstyle>
      </m:mrow>
      <m:mrow>
         <m:mstyle class="text">
            <m:mtext class="textsf" mathvariant="sans-serif">2</m:mtext>
         </m:mstyle>
      </m:mrow>
   </m:msup>
   <m:mfenced close=")" open="(" separators="">
      <m:mrow>
         <m:msub>
            <m:mrow>
               <m:mi>g</m:mi>
            </m:mrow>
            <m:mrow>
               <m:mi>c</m:mi>
            </m:mrow>
         </m:msub>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mstyle class="text">
            <m:mtext class="textsf" mathvariant="sans-serif">&#160;</m:mtext>
         </m:mstyle>
         <m:msub>
            <m:mrow>
               <m:mi>g</m:mi>
            </m:mrow>
            <m:mrow>
               <m:mi>n</m:mi>
            </m:mrow>
         </m:msub>
      </m:mrow>
   </m:mfenced>
   <m:mspace class="thinspace" width="0.3em"/>
   <m:mspace class="thinspace" width="0.3em"/>
   <m:mi>n</m:mi>
   <m:mo class="MathClass-rel">=</m:mo>
   <m:mn>1</m:mn>
   <m:mo class="MathClass-punc">,</m:mo>
   <m:mn>2</m:mn>
   <m:mspace class="thinspace" width="0.3em"/>
   <m:mo class="MathClass-punc">.</m:mo>
   <m:mo class="MathClass-punc">.</m:mo>
   <m:mo class="MathClass-punc">.</m:mo>
   <m:mi>N</m:mi>
</m:mrow>
</m:math>
               </display-formula>
            </p>
            <p>Where, <it>g<sub>c </sub></it>&#8712; <b>C</b><it>, g<sub>n </sub></it>&#8712; <b>G</b><it><sub>N</sub></it>.</p>
            <p>Then selection of <it>g</it><sub><it>N</it>+1 </sub>can be based on the Minimum Sum of the square of the Correlation (MSC), that is,</p>
            <p>
               <display-formula id="M8">
                  <m:math xmlns:m="http://www.w3.org/1998/Math/MathML" name="1471-2164-12-S5-S1-i8"><m:mrow>
   <m:msub>
      <m:mrow>
         <m:mi>g</m:mi>
      </m:mrow>
      <m:mrow>
         <m:mi>N</m:mi>
         <m:mo class="MathClass-bin">+</m:mo>
         <m:mn>1</m:mn>
      </m:mrow>
   </m:msub>
   <m:mo class="MathClass-rel">&#8592;</m:mo>
   <m:mrow>
      <m:mo class="MathClass-open">{</m:mo>
      <m:mrow>
         <m:msub>
            <m:mrow>
               <m:mi>g</m:mi>
            </m:mrow>
            <m:mrow>
               <m:mi>c</m:mi>
            </m:mrow>
         </m:msub>
         <m:mo class="MathClass-rel">|</m:mo>
         <m:mstyle class="text">
            <m:mtext class="textsf" mathvariant="sans-serif">SC</m:mtext>
         </m:mstyle>
         <m:mrow>
            <m:mo class="MathClass-open">(</m:mo>
            <m:mrow>
               <m:msub>
                  <m:mrow>
                     <m:mi>g</m:mi>
                  </m:mrow>
                  <m:mrow>
                     <m:mi>c</m:mi>
                  </m:mrow>
               </m:msub>
            </m:mrow>
            <m:mo class="MathClass-close">)</m:mo>
         </m:mrow>
         <m:mo class="MathClass-rel">=</m:mo>
         <m:mo class="qopname"> min</m:mo>
         <m:mrow>
            <m:mo class="MathClass-open">(</m:mo>
            <m:mrow>
               <m:mstyle class="text">
                  <m:mtext class="textsf" mathvariant="sans-serif">SC</m:mtext>
               </m:mstyle>
            </m:mrow>
            <m:mo class="MathClass-close">)</m:mo>
         </m:mrow>
         <m:mo class="MathClass-punc">.</m:mo>
         <m:msub>
            <m:mrow>
               <m:mi>g</m:mi>
            </m:mrow>
            <m:mrow>
               <m:mi>c</m:mi>
            </m:mrow>
         </m:msub>
         <m:mo class="MathClass-rel">&#8712;</m:mo>
         <m:mstyle mathvariant="bold">
            <m:mi>C</m:mi>
         </m:mstyle>
      </m:mrow>
      <m:mo class="MathClass-close">}</m:mo>
   </m:mrow>
</m:mrow>
</m:math>
               </display-formula>
            </p>
            <p>In the second formula, the maximum value of the square of the correlation, MC, is calculated:</p>
            <p>
               <display-formula id="M9">
                  <m:math xmlns:m="http://www.w3.org/1998/Math/MathML" name="1471-2164-12-S5-S1-i9"><m:mrow>
   <m:mstyle class="text">
      <m:mtext class="textsf" mathvariant="sans-serif">MC</m:mtext>
   </m:mstyle>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:msub>
            <m:mrow>
               <m:mi>g</m:mi>
            </m:mrow>
            <m:mrow>
               <m:mi>c</m:mi>
            </m:mrow>
         </m:msub>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
   <m:mo class="MathClass-rel">=</m:mo>
   <m:mo class="qopname"> max</m:mo>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mstyle class="text">
            <m:mtext class="textsf" mathvariant="sans-serif">co</m:mtext>
         </m:mstyle>
         <m:msup>
            <m:mrow>
               <m:mstyle class="text">
                  <m:mtext class="textsf" mathvariant="sans-serif">r</m:mtext>
               </m:mstyle>
            </m:mrow>
            <m:mrow>
               <m:mn>2</m:mn>
            </m:mrow>
         </m:msup>
         <m:mrow>
            <m:mo class="MathClass-open">(</m:mo>
            <m:mrow>
               <m:msub>
                  <m:mrow>
                     <m:mi>g</m:mi>
                  </m:mrow>
                  <m:mrow>
                     <m:mi>c</m:mi>
                  </m:mrow>
               </m:msub>
               <m:mo class="MathClass-punc">,</m:mo>
               <m:msub>
                  <m:mrow>
                     <m:mi>g</m:mi>
                  </m:mrow>
                  <m:mrow>
                     <m:mi>n</m:mi>
                  </m:mrow>
               </m:msub>
            </m:mrow>
            <m:mo class="MathClass-close">)</m:mo>
         </m:mrow>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
   <m:mo class="MathClass-punc">,</m:mo>
   <m:mspace class="tmspace" width="2.77695pt"/>
   <m:mspace class="tmspace" width="2.77695pt"/>
   <m:mi>n</m:mi>
   <m:mo class="MathClass-rel">=</m:mo>
   <m:mn>1</m:mn>
   <m:mo class="MathClass-punc">,</m:mo>
   <m:mn>2</m:mn>
   <m:mo class="MathClass-punc">,</m:mo>
   <m:mo class="MathClass-punc">.</m:mo>
   <m:mo class="MathClass-punc">.</m:mo>
   <m:mo class="MathClass-punc">.</m:mo>
   <m:mo class="MathClass-punc">,</m:mo>
   <m:mi>N</m:mi>
</m:mrow>
</m:math>
               </display-formula>
            </p>
            <p>Where, <it>g<sub>c </sub></it>&#8712; <b>C</b><it>, g<sub>n </sub></it>&#8712; <b>G</b><it><sub>N</sub></it>.</p>
            <p>The selection of <it>g<sub>N+1 </sub></it>follows the criterion that the MC value is the minimum, which we call Minimum of Maximum value of the square of the Correlation (MMC).</p>
            <p>
               <display-formula id="M10">
                  <m:math xmlns:m="http://www.w3.org/1998/Math/MathML" name="1471-2164-12-S5-S1-i10"><m:mrow>
   <m:msub>
      <m:mrow>
         <m:mi>g</m:mi>
      </m:mrow>
      <m:mrow>
         <m:mi>N</m:mi>
         <m:mo class="MathClass-bin">+</m:mo>
         <m:mn>1</m:mn>
      </m:mrow>
   </m:msub>
   <m:mo class="MathClass-rel">&#8592;</m:mo>
   <m:mrow>
      <m:mo class="MathClass-open">{</m:mo>
      <m:mrow>
         <m:msub>
            <m:mrow>
               <m:mi>g</m:mi>
            </m:mrow>
            <m:mrow>
               <m:mi>c</m:mi>
            </m:mrow>
         </m:msub>
         <m:mo class="MathClass-rel">|</m:mo>
         <m:mstyle class="text">
            <m:mtext class="textsf" mathvariant="sans-serif">MC</m:mtext>
         </m:mstyle>
         <m:mrow>
            <m:mo class="MathClass-open">(</m:mo>
            <m:mrow>
               <m:msub>
                  <m:mrow>
                     <m:mi>g</m:mi>
                  </m:mrow>
                  <m:mrow>
                     <m:mi>c</m:mi>
                  </m:mrow>
               </m:msub>
            </m:mrow>
            <m:mo class="MathClass-close">)</m:mo>
         </m:mrow>
         <m:mo class="MathClass-rel">=</m:mo>
         <m:mo class="qopname"> min</m:mo>
         <m:mrow>
            <m:mo class="MathClass-open">(</m:mo>
            <m:mrow>
               <m:mstyle class="text">
                  <m:mtext class="textsf" mathvariant="sans-serif">MC</m:mtext>
               </m:mstyle>
            </m:mrow>
            <m:mo class="MathClass-close">)</m:mo>
         </m:mrow>
         <m:mo class="MathClass-punc">.</m:mo>
         <m:msub>
            <m:mrow>
               <m:mi>g</m:mi>
            </m:mrow>
            <m:mrow>
               <m:mi>c</m:mi>
            </m:mrow>
         </m:msub>
         <m:mo class="MathClass-rel">&#8712;</m:mo>
         <m:mstyle mathvariant="bold">
            <m:mi>C</m:mi>
         </m:mstyle>
      </m:mrow>
      <m:mo class="MathClass-close">}</m:mo>
   </m:mrow>
</m:mrow>
</m:math>
               </display-formula>
            </p>
            <p>In the methods mentioned above, a feature is recursively added to the chosen feature set based on supervised learning and the similarity measures. With the use of a classifier XXX, we call the first gene selection method XXX-MSC and the second one XXX-MMC. For example, if the classifier is Naive Bayes Classifier (NBC), we call the two strategies NBC-MSC and NBC-MMC, respectively.</p>
         </sec>
         <sec>
            <st>
               <p>Lagging Prediction Peephole Optimization (LPPO)</p>
            </st>
            <p>We want to find a combination of features (genes) that yields the best classification performance. Normally, with the recursive addition for the next feature, the training accuracy will increase and reach a peak classification performance at some point, and then may maintain it with subsequent feature additions; but after that the training accuracy may decrease. Generally speaking, all strategies for determining the final feature set should be based on the best training classification. In high-volume data analysis, it is common that the best training accuracy corresponds to different feature sets; that is, multiple feature sets achieve the same highest training accuracy. However, although all these feature sets are associated with the same highest training accuracy, the testing accuracy of these feature sets may be different. Among these highest training feature sets, the one having the best testing accuracy is called the optimal feature set, which is highly complicated to characterize when a sample size is small. Either applying different gene selection methods to the same training samples, or applying the same gene selection method to different training samples, or applying different learning classifiers to the same training samples, will produce a different optimization of the feature set. Pochet <it>et al. </it><abbrgrp><abbr bid="B29">29</abbr></abbrgrp> presented a method of determining the optimal number of genes by means of a cross-validation procedure; the drawback of this method is that it actually utilizes whole data information, including training samples and testing samples.</p>
            <p>How do we choose the optimal feature set? If there are multiple best training classifications, a random choice, called random strategy, works for best training classification. In the recursive addition of the features, for training samples, a classification model is one of the best methods. But for testing samples, at this point, the classification model may not be optimal because of the difference between the training samples and the testing samples; the optimal classification model will lag in appearance (see Figure <figr fid="F1">1</figr>). Based on this observation, we propose the following algorithm for optimization.</p>
            <p>Under feature dimension <it>j</it>, the training accuracy of the <it>i</it><sup>th </sup>experiment is <it>r</it>(<it>i, j</it>). If the feature set <b>G</b><it><sub>k</sub></it>, corresponding to feature dimension <it>k</it>, has the best training accuracy in the trainings from the feature set <b>G</b><sub>1 </sub>to <b>G</b><sub>D</sub>, corresponding to the feature dimensions from 1 to D, let <b>HR </b>denote the set that contains all the combinations of <b>G</b><it><sub>k</sub></it>, corresponding to all the feature set having the highest classification accuracy under feature dimension 1 to D.</p>
            <p>
               <display-formula id="M11">
                  <m:math xmlns:m="http://www.w3.org/1998/Math/MathML" name="1471-2164-12-S5-S1-i11"><m:mrow>
   <m:mstyle mathvariant="bold">
      <m:mi>H</m:mi>
      <m:mi>R</m:mi>
   </m:mstyle>
   <m:mo class="MathClass-rel">=</m:mo>
   <m:mrow>
      <m:mo class="MathClass-open">{</m:mo>
      <m:mrow>
         <m:msub>
            <m:mrow>
               <m:mstyle mathvariant="bold">
                  <m:mi>G</m:mi>
               </m:mstyle>
            </m:mrow>
            <m:mrow>
               <m:mi>k</m:mi>
            </m:mrow>
         </m:msub>
         <m:mo class="MathClass-rel">|</m:mo>
         <m:mi>r</m:mi>
         <m:mrow>
            <m:mo class="MathClass-open">(</m:mo>
            <m:mrow>
               <m:mi>i</m:mi>
               <m:mo class="MathClass-punc">,</m:mo>
               <m:mi>k</m:mi>
            </m:mrow>
            <m:mo class="MathClass-close">)</m:mo>
         </m:mrow>
         <m:mo class="MathClass-rel">=</m:mo>
         <m:mo class="qopname"> max</m:mo>
         <m:mrow>
            <m:mo class="MathClass-open">(</m:mo>
            <m:mrow>
               <m:mi>r</m:mi>
               <m:mrow>
                  <m:mo class="MathClass-open">(</m:mo>
                  <m:mrow>
                     <m:mi>i</m:mi>
                     <m:mo class="MathClass-punc">,</m:mo>
                     <m:mo class="MathClass-bin">&#8729;</m:mo>
                  </m:mrow>
                  <m:mo class="MathClass-close">)</m:mo>
               </m:mrow>
            </m:mrow>
            <m:mo class="MathClass-close">)</m:mo>
         </m:mrow>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mspace class="tmspace" width="2.77695pt"/>
         <m:mspace class="tmspace" width="2.77695pt"/>
         <m:mn>1</m:mn>
         <m:mo class="MathClass-rel">&#8804;</m:mo>
         <m:mi>k</m:mi>
         <m:mo class="MathClass-rel">&#8804;</m:mo>
         <m:mi>D</m:mi>
      </m:mrow>
      <m:mo class="MathClass-close">}</m:mo>
   </m:mrow>
</m:mrow>
</m:math>
               </display-formula>
            </p>
            <p>In general, the best classification model for testing samples will lag in appearance behind the initial best training model. We will exclude the elements of <b>HR </b>that correspond to the initial best training. The remaining elements in <b>HR </b>constitute the candidate set <b>HRC </b>for optimization.</p>
            <p>Each element in <b>HRC </b>is associated with the best training accuracy. We set a peephole for each element and choose the element associated with the optimal peephole. The details are described as follows:</p>
            <p>a. For each element <b>G</b><it><sub>k </sub></it>&#8712; <b>HRC</b>, the peephole over <b>G</b><it><sub>k </sub></it>with length of 2<it>l</it>+1 covers the feature sets <b>G</b><it><sub>k-l</sub></it>, <b>G</b><sub><it>k-l+</it>1</sub>, ..., <b>G</b><it><sub>k </sub></it>, ..., <b>G</b><sub><it>k+l</it>-1</sub>, <b>G</b><it><sub>k+l</sub></it>, corresponding to the training accuracy <it>r</it>(<it>i, k-l</it>), <it>r</it>(<it>i, k-l+</it>1), ..., <it>r</it>(<it>i, k</it>), ..., <it>r</it>(<it>i, k+l-</it>1), <it>r</it>(<it>i, k+l</it>). The mean training value of the peephole is denoted by mp_r(<it>i</it>, <it>k</it>).</p>
            <p>
               <display-formula id="M12">
                  <m:math xmlns:m="http://www.w3.org/1998/Math/MathML" name="1471-2164-12-S5-S1-i12"><m:mrow>
   <m:mi>m</m:mi>
   <m:mi>p</m:mi>
   <m:mstyle class="text">
      <m:mtext>_</m:mtext>
   </m:mstyle>
   <m:mi>r</m:mi>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mi>i</m:mi>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mi>k</m:mi>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
   <m:mo class="MathClass-rel">=</m:mo>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mn>1</m:mn>
         <m:mo class="MathClass-bin">&#8725;</m:mo>
         <m:mrow>
            <m:mo class="MathClass-open">(</m:mo>
            <m:mrow>
               <m:mn>2</m:mn>
               <m:mi>l</m:mi>
               <m:mo class="MathClass-bin">+</m:mo>
               <m:mn>1</m:mn>
            </m:mrow>
            <m:mo class="MathClass-close">)</m:mo>
         </m:mrow>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
   <m:msubsup>
      <m:mrow>
         <m:mo mathsize="big">&#8721;</m:mo>
      </m:mrow>
      <m:mrow>
         <m:mi>m</m:mi>
         <m:mo class="MathClass-rel">=</m:mo>
         <m:mi>k</m:mi>
         <m:mo class="MathClass-bin">-</m:mo>
         <m:mi>l</m:mi>
      </m:mrow>
      <m:mrow>
         <m:mi>m</m:mi>
         <m:mo class="MathClass-rel">=</m:mo>
         <m:mi>k</m:mi>
         <m:mo class="MathClass-bin">+</m:mo>
         <m:mi>l</m:mi>
      </m:mrow>
   </m:msubsup>
   <m:mi>r</m:mi>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mi>i</m:mi>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mi>m</m:mi>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
</m:mrow>
</m:math>
               </display-formula>
            </p>
            <p>The peephole with the best classification of mp_r is then chosen as the optimal one.</p>
            <p>b. If there are multiple optimal peepholes, then we apply random forest to these peepholes and check the mean values of the Out-of-Bag (OOB) error rates <abbrgrp><abbr bid="B24">24</abbr><abbr bid="B25">25</abbr><abbr bid="B30">30</abbr></abbrgrp>. The feature sets <b>G</b><it><sub>k-l</sub></it>, <b>G</b><sub><it>k-l</it>+1</sub>, ..., <b>G</b><sub><it>k</it></sub>, ..., <b>G</b><sub><it>k+l</it>-1</sub>, <b>G</b><it><sub>k+l </sub></it>correspond to the OOB errors, oob_e(<it>i</it>, <it>k</it>-<it>l</it>), oob_e(<it>i</it>, <it>k</it>-<it>l+</it>1), ..., oob_e(<it>i</it>, <it>k</it>), ..., oob_e(<it>i</it>, <it>k</it>+<it>l-</it>1), oob_e(<it>i</it>, <it>k+l</it>). The mean value of the OOB errors is denoted by mp_oob_e(<it>i</it>, <it>k</it>).</p>
            <p>
               <display-formula id="M13">
                  <m:math xmlns:m="http://www.w3.org/1998/Math/MathML" name="1471-2164-12-S5-S1-i13"><m:mrow>
   <m:mi>m</m:mi>
   <m:mi>p</m:mi>
   <m:mstyle class="text">
      <m:mtext>_</m:mtext>
   </m:mstyle>
   <m:mi>o</m:mi>
   <m:mi>o</m:mi>
   <m:mi>b</m:mi>
   <m:mstyle class="text">
      <m:mtext>_</m:mtext>
   </m:mstyle>
   <m:mi>e</m:mi>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mi>i</m:mi>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mi>k</m:mi>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
   <m:mo class="MathClass-rel">=</m:mo>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mn>1</m:mn>
         <m:mo class="MathClass-bin">&#8725;</m:mo>
         <m:mrow>
            <m:mo class="MathClass-open">(</m:mo>
            <m:mrow>
               <m:mn>2</m:mn>
               <m:mi>l</m:mi>
               <m:mo class="MathClass-bin">+</m:mo>
               <m:mn>1</m:mn>
            </m:mrow>
            <m:mo class="MathClass-close">)</m:mo>
         </m:mrow>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
   <m:msubsup>
      <m:mrow>
         <m:mo mathsize="big">&#8721;</m:mo>
      </m:mrow>
      <m:mrow>
         <m:mi>m</m:mi>
         <m:mo class="MathClass-rel">=</m:mo>
         <m:mi>k</m:mi>
         <m:mo class="MathClass-bin">-</m:mo>
         <m:mi>l</m:mi>
      </m:mrow>
      <m:mrow>
         <m:mi>m</m:mi>
         <m:mo class="MathClass-rel">=</m:mo>
         <m:mi>k</m:mi>
         <m:mo class="MathClass-bin">+</m:mo>
         <m:mi>l</m:mi>
      </m:mrow>
   </m:msubsup>
   <m:mi>o</m:mi>
   <m:mi>o</m:mi>
   <m:mi>b</m:mi>
   <m:mstyle class="text">
      <m:mtext>_</m:mtext>
   </m:mstyle>
   <m:mi>e</m:mi>
   <m:mrow>
      <m:mo class="MathClass-open">(</m:mo>
      <m:mrow>
         <m:mi>i</m:mi>
         <m:mo class="MathClass-punc">,</m:mo>
         <m:mi>m</m:mi>
      </m:mrow>
      <m:mo class="MathClass-close">)</m:mo>
   </m:mrow>
</m:mrow>
</m:math>
               </display-formula>
            </p>
            <p>The peephole with minimum mp_oob_e is the optimal one.</p>
            <p>c. If there are multiple peepholes corresponding to the best mp_r and minimum mp_oob_e, then set <it>l </it>+1 &#8594; <it>l</it>, and repeat 'a' to 'c', until a unique optimal peephole is determined.</p>
            <p>d. The feature set located at the center of the final optimal peephole is chosen as the final optimal feature set.</p>
            <p>This optimization of RFA is called Lagging Prediction Peephole Optimization (LPPO). Figure <figr fid="F3">3</figr> briefly outlines the LPPO on the prostate data set, which was studied by Singh <it>et al. </it><abbrgrp><abbr bid="B31">31</abbr></abbrgrp>.</p>
            <fig id="F3"><title><p>Figure 3</p></title><caption><p>A sketch description of the Lagging Prediction Peephole Optimization on Prostate data set</p></caption><text>
   <p><b>A sketch description of the Lagging Prediction Peephole Optimization on Prostate data set</b>.</p>
</text><graphic file="1471-2164-12-S5-S1-3"/></fig>
         </sec>
         <sec>
            <st>
               <p>Data sets</p>
            </st>
            <p>The following six benchmark microarray data sets have been extensively studied and used in our experiments to compare the performances of our methods with others. Data sources that are not specified are available at: <url>http://www.broad.mit.edu/cgi-bin/cancer/datasets.cgi</url>.</p>
            <p>1) The LEUKEMIA data set consists of two types of acute leukemia: 48 acute lymphoblastic leukemia (ALL) samples and 25 acute myeloblastic leukemia (AML) samples with over 7129 probes from 6817 human genes. It was studied by Golub <it>et al. </it><abbrgrp><abbr bid="B32">32</abbr></abbrgrp>.</p>
            <p>2) The LYMPHOMA data set consists of 58 diffuse large B-cell lymphoma (DLBCL) samples and 19 follicular lymphoma (FL) samples. It was studied by Shipp <it>et al. </it><abbrgrp><abbr bid="B33">33</abbr></abbrgrp>. The data file, lymphoma_8_lbc_fscc2_rn.res, and the class label file, lymphoma_8_lbc_fscc2.cls were used in our experiments for identifying DLBCL and FL.</p>
            <p>3) The PROSTATE data set used by Singh <it>et al. </it><abbrgrp><abbr bid="B31">31</abbr></abbrgrp> contains 52 prostate tumor samples and 50 non-tumor prostate samples.</p>
            <p>4) The COLON cancer data set used by Alon <it>et al. </it><abbrgrp><abbr bid="B34">34</abbr></abbrgrp> contains 62 samples collected from colon-cancer patients. Among them, 40 tumor biopsies are from tumors, and 22 normal biopsies are from healthy parts of the colons of the same patients. Based on the confidence in the measured expression levels, 2000 genes were selected. The data source is available at: <url>http://microarray.princeton.edu/oncology/affydata/index.html</url>.</p>
            <p>5) The Central Nervous System (CNS) embryonal tumor data set that was originally studied by Pomeroy <it>et al. </it><abbrgrp><abbr bid="B35">35</abbr></abbrgrp> contains 60 patient samples. Among them, 21 are survivors who are alive after treatment, and 39 are failures who succumbed to their diseases. There are 7129 genes.</p>
            <p>6) The Breast cancer data set studied by Van <it>et al. </it><abbrgrp><abbr bid="B36">36</abbr></abbrgrp> contains 97 patient samples, 46 of which are from relapse patients who had developed distant metastases within 5 years, and 51 of which are from non-relapse patients who remained free of the disease for at least 5 years after their initial diagnosis. This data source is available at: <url>http://www.rii.com/publications/2002/vantveer.htm</url>.</p>
         </sec>
         <sec>
            <st>
               <p>Experiments</p>
            </st>
            <p>Our experiments are designed as follows:</p>
            <p>1. The data sets are first divided randomly into training samples and testing samples. The ratio of training samples to testing samples is approximately 1:1 in each class.</p>
            <p>2. Recursive feature additions with Naive Bayes Classifier (NBC) and Nearest Mean Scaled Classifier (NMSC) (NBC-MSC, NBC-MMC, NMSC-MSC, and NMSC-MMC) were applied to the training samples for gene selection. Different feature sets of the gene expression data were produced under feature dimensions 1 to 100. We compared the above proposed methods to several recently developed and published gene selection methods: LOOCSFS, GLGS, SVMRFE, SFFS-LS bound, SFS-LS bound, and also T-TEST.</p>
            <p>3. To compare different gene selection methods, the learning classifiers including NBC, NMSC, SVM <abbrgrp><abbr bid="B37">37</abbr><abbr bid="B38">38</abbr></abbrgrp>, and Random Forest are applied to the testing samples.</p>
            <p>4. The experiments were performed in 20 runs, and the average testing accuracies were compared to evaluate performance.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>QL designed the algorithms, performed the study, and wrote the draft; AHS supervised the study and revised the draft; ZC helped design the algorithms and experiments, provided the statistical analysis, and co-drafted the manuscript; LC, JL, MQ, YP, ZW and HX participated in algorithm design and programming, and helped edit the draft; and YP coordinated the project and assisted with the draft and data analyses.</p>
      </sec>
      <sec>
         <st>
            <p>Competing interests</p>
         </st>
         <p>The authors declare that they have no competing interests.</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>The authors are grateful to Matteo Masotti, E Ke Tang, and Xin Zhou for offering their codes of RfeRank, GLGS, LOOCSFS, SFS-LSbound, and SFFS-LSbound, and to Ramon Diaz-Uriarte for the help with the use of the varSelRF R package. Partial support for this study from the Institute for Complex Additive Systems Analysis, a division of New Mexico Tech, and from Sam Houston State University, is gratefully acknowledged.</p>
         </sec>
      </ack>
      <refgrp><bibl id="B1"><title><p>A distribution free summarization method for Affymetrix GeneChip Arrays</p></title><aug><au><snm>Chen</snm><fnm>Z</fnm></au><au><snm>McGee</snm><fnm>M</fnm></au><au><snm>Liu</snm><fnm>Q</fnm></au><au><snm>Scheuermann</snm><fnm>RH</fnm></au></aug><source>Bioinformatics</source><pubdate>2007</pubdate><volume>23</volume><issue>3</issue><fpage>321</fpage><lpage>327</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/btl609</pubid><pubid idtype="pmpid" link="fulltext">17148508</pubid></pubidlist></xrefbib></bibl><bibl id="B2"><title><p>Computational analysis of microarray data</p></title><aug><au><snm>Quackenbush</snm><fnm>J</fnm></au></aug><source>Nat Rev Genet</source><pubdate>2001</pubdate><volume>2</volume><issue>6</issue><fpage>418</fpage><lpage>427</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/35076576</pubid><pubid idtype="pmpid" link="fulltext">11389458</pubid></pubidlist></xrefbib></bibl><bibl id="B3"><title><p>Finding groups in gene expression data</p></title><aug><au><snm>Hand</snm><fnm>DJ</fnm></au><au><snm>Heard</snm><fnm>NA</fnm></au></aug><source>J Biomed Biotechnol</source><pubdate>2005</pubdate><issue>2</issue><fpage>215</fpage><lpage>225</lpage></bibl><bibl id="B4"><title><p>From signatures to models: understanding cancer using microarrays</p></title><aug><au><snm>Segal</snm><fnm>E</fnm></au><au><snm>Friedman</snm><fnm>N</fnm></au><au><snm>Kaminski</snm><fnm>N</fnm></au><au><snm>Regev</snm><fnm>A</fnm></au><au><snm>Koller</snm><fnm>D</fnm></au></aug><source>Nat Genet</source><pubdate>2005</pubdate><volume>37</volume><issue>Suppl</issue><fpage>S38</fpage><lpage>45</lpage><xrefbib><pubid idtype="pmpid" link="fulltext">15920529</pubid></xrefbib></bibl><bibl id="B5"><title><p>A new algorithm for comparing and visualizing relationships between hierarchical and flat gene expression data 
clusterings</p></title><aug><au><snm>Torrente</snm><fnm>A</fnm></au><au><snm>Kapushesky</snm><fnm>M</fnm></au><au><snm>Brazma</snm><fnm>A</fnm></au></aug><source>Bioinformatics</source><pubdate>2005</pubdate><volume>21</volume><issue>21</issue><fpage>3993</fpage><lpage>3999</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/bti644</pubid><pubid idtype="pmpid" link="fulltext">16141251</pubid></pubidlist></xrefbib></bibl><bibl id="B6"><title><p>Clustering microarray gene expression data using weighted Chinese restaurant process</p></title><aug><au><snm>Qin</snm><fnm>Z</fnm></au></aug><source>Bioinformatics</source><pubdate>2006</pubdate><volume>22</volume><issue>16</issue><fpage>1988</fpage><lpage>1997</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/btl284</pubid><pubid idtype="pmpid" link="fulltext">16766561</pubid></pubidlist></xrefbib></bibl><bibl id="B7"><title><p>Standards for system biology</p></title><aug><au><snm>Brazma</snm><fnm>A</fnm></au><au><snm>Krestyaninova</snm><fnm>M</fnm></au><au><snm>Sarkans</snm><fnm>U</fnm></au></aug><source>Nat Rev Genet</source><pubdate>2006</pubdate><volume>7</volume><fpage>593</fpage><lpage>605</lpage><xrefbib><pubid idtype="pmpid" link="fulltext">16847461</pubid></xrefbib></bibl><bibl id="B8"><title><p>On differential variability of expression ratios: improving statistical inference about gene expression changes from microarray data</p></title><aug><au><snm>Newton</snm><fnm>MA</fnm></au><au><snm>Kendziorski</snm><fnm>CM</fnm></au><au><snm>Richmond</snm><fnm>CS</fnm></au><au><snm>Blattner</snm><fnm>FR</fnm></au><au><snm>Tsui</snm><fnm>KW</fnm></au></aug><source>J Comput Biol</source><pubdate>2001</pubdate><volume>8</volume><issue>1</issue><fpage>37</fpage><lpage>52</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1089/106652701300099074</pubid><pubid idtype="pmpid" link="fulltext">11339905</pubid></pubidlist></xrefbib></bibl><bibl id="B9"><title><p>Improved statistical inference from 
DNA microarray data using analysis of variance and a Bayesian statistical framework</p></title><aug><au><snm>Long</snm><fnm>A</fnm></au><au><snm>Mangalam</snm><fnm>H</fnm></au><au><snm>Chan</snm><fnm>B</fnm></au><au><snm>Tolleri</snm><fnm>L</fnm></au><au><snm>Hatfield</snm><fnm>G</fnm></au><au><snm>Baldi</snm><fnm>P</fnm></au></aug><source>J Biol Chem</source><volume>276</volume><issue>23</issue><fpage>19937</fpage><lpage>19944</lpage></bibl><bibl id="B10"><title><p>New feature subset selection procedures for classification of expression profiles</p></title><aug><au><snm>Bo</snm><fnm>T</fnm></au><au><snm>Jonassen</snm><fnm>I</fnm></au></aug><source>Genome Biol</source><pubdate>2002</pubdate><volume>3</volume><issue>4</issue><fpage>research0017</fpage><xrefbib><pubidlist><pubid idtype="pmcid">115205</pubid><pubid idtype="pmpid" link="fulltext">11983058</pubid></pubidlist></xrefbib></bibl><bibl id="B11"><title><p>Bayesian neural network approaches to ovarian cancer identification from high-resolution mass spectrometry data</p></title><aug><au><snm>Yu</snm><fnm>J</fnm></au><au><snm>Chen</snm><fnm>X-W</fnm></au></aug><source>Bioinformatics</source><pubdate>2005</pubdate><volume>21</volume><issue>suppl 1</issue><fpage>i487</fpage><lpage>i494</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/bti1030</pubid><pubid idtype="pmpid" link="fulltext">15961495</pubid></pubidlist></xrefbib></bibl><bibl id="B12"><title><p>Analysis of strain and regional variation in gene expression in mouse brain</p></title><aug><au><snm>Pavlidis</snm><fnm>P</fnm></au><au><snm>Noble</snm><fnm>WS</fnm></au></aug><source>Genome Biol</source><pubdate>2001</pubdate><volume>2</volume><issue>10</issue><fpage>0042.1</fpage><lpage>0042.15</lpage></bibl><bibl id="B13"><title><p>Gene selection by sequential search wrapper approaches in microarray cancer class 
prediction</p></title><aug><au><snm>Inza</snm><fnm>I</fnm></au><au><snm>Sierra</snm><fnm>B</fnm></au><au><snm>Blanco</snm><fnm>R</fnm></au><au><snm>Larranaga</snm><fnm>P</fnm></au></aug><source>Journal of Intelligent and Fuzzy Systems</source><pubdate>2002</pubdate><volume>12</volume><issue>1</issue><fpage>25</fpage><lpage>33</lpage></bibl><bibl id="B14"><title><p>Gene selection for cancer classification using support vector machines</p></title><aug><au><snm>Guyon</snm><fnm>I</fnm></au><au><snm>Weston</snm><fnm>J</fnm></au><au><snm>Barnhill</snm><fnm>S</fnm></au><au><snm>Vapnik</snm><fnm>VN</fnm></au></aug><source>Machine Learning</source><pubdate>2002</pubdate><volume>46</volume><issue>19</issue><fpage>389</fpage><lpage>422</lpage></bibl><bibl id="B15"><title><p>Feature mining and pattern classification for steganalysis of LSB matching steganography in grayscale images</p></title><aug><au><snm>Liu</snm><fnm>Q</fnm></au><au><snm>Sung</snm><fnm>AH</fnm></au><au><snm>Chen</snm><fnm>Z</fnm></au><au><snm>Xu</snm><fnm>J</fnm></au></aug><source>Pattern Recognition</source><pubdate>2008</pubdate><volume>41</volume><issue>1</issue><fpage>56</fpage><lpage>66</lpage><xrefbib><pubid idtype="doi">10.1016/j.patcog.2007.06.005</pubid></xrefbib></bibl><bibl id="B16"><title><p>An improved approach to steganalysis of JPEG images</p></title><aug><au><snm>Liu</snm><fnm>Q</fnm></au><au><snm>Sung</snm><fnm>AH</fnm></au><au><snm>Qiao</snm><fnm>M</fnm></au><au><snm>Chen</snm><fnm>Z</fnm></au><au><snm>Ribeiro</snm><fnm>B</fnm></au></aug><source>Information Sciences</source><pubdate>2010</pubdate><volume>180</volume><issue>9</issue><fpage>1643</fpage><lpage>1655</lpage><xrefbib><pubid idtype="doi">10.1016/j.ins.2010.01.001</pubid></xrefbib></bibl><bibl id="B17"><title><p>Withdrawing an example from the training set: an analytic estimation of its effect on a nonlinear parameterized 
model</p></title><aug><au><snm>Monari</snm><fnm>G</fnm></au><au><snm>Dreyfus</snm><fnm>G</fnm></au></aug><source>Neurocomputing</source><pubdate>2000</pubdate><volume>35</volume><issue>1-4</issue><fpage>195</fpage><lpage>201</lpage><xrefbib><pubid idtype="doi">10.1016/S0925-2312(00)00325-8</pubid></xrefbib></bibl><bibl id="B18"><title><p>MLPs (Mono-Layer Polynomials and Multi-Layer Perceptrons) for nonlinear modeling</p></title><aug><au><snm>Rivals</snm><fnm>I</fnm></au><au><snm>Personnaz</snm><fnm>L</fnm></au></aug><source>Journal of Machine Learning Research</source><pubdate>2003</pubdate><volume>3</volume><fpage>1383</fpage><lpage>1398</lpage></bibl><bibl id="B19"><title><p>Regression shrinkage and selection via the lasso</p></title><aug><au><snm>Tibshirani</snm><fnm>R</fnm></au></aug><source>J Royal Statist Soc B</source><pubdate>1996</pubdate><volume>58</volume><issue>1</issue><fpage>267</fpage><lpage>288</lpage></bibl><bibl id="B20"><title><p>The lasso method for variable selection in the Cox model</p></title><aug><au><snm>Tibshirani</snm><fnm>R</fnm></au></aug><source>Stat Med</source><pubdate>1997</pubdate><volume>16</volume><issue>4</issue><fpage>385</fpage><lpage>395</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1002/(SICI)1097-0258(19970228)16:4&lt;385::AID-SIM380&gt;3.0.CO;2-3</pubid><pubid idtype="pmpid" link="fulltext">9044528</pubid></pubidlist></xrefbib></bibl><bibl id="B21"><title><p>Sparse multinomial logistic regression: fast algorithms, and generalization bounds</p></title><aug><au><snm>Krishnapuram</snm><fnm>B</fnm></au><au><snm>Carin</snm><fnm>L</fnm></au><au><snm>Figueiredo</snm><fnm>M</fnm></au><au><snm>Hartemink</snm><fnm>A</fnm></au></aug><source>IEEE Trans Pattern Anal Mach Intell</source><pubdate>2005</pubdate><volume>27</volume><issue>6</issue><fpage>957</fpage><lpage>968</lpage><xrefbib><pubid idtype="pmpid" link="fulltext">15943426</pubid></xrefbib></bibl><bibl id="B22"><title><p>LS bound based gene selection for DNA microarray 
data</p></title><aug><au><snm>Zhou</snm><fnm>X</fnm></au><au><snm>Mao</snm><fnm>K-Z</fnm></au></aug><source>Bioinformatics</source><pubdate>2005</pubdate><volume>21</volume><issue>8</issue><fpage>1559</fpage><lpage>1564</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/bti216</pubid><pubid idtype="pmpid" link="fulltext">15598834</pubid></pubidlist></xrefbib></bibl><bibl id="B23"><title><p>Gene selection algorithms for microarray data based on least square support vector machine</p></title><aug><au><snm>Tang</snm><fnm>E-K</fnm></au><au><snm>Suganthan</snm><fnm>PN</fnm></au><au><snm>Yao</snm><fnm>X</fnm></au></aug><source>BMC Bioinformatics</source><pubdate>2006</pubdate><volume>7</volume><fpage>95</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1186/1471-2105-7-95</pubid><pubid idtype="pmcid">1409801</pubid><pubid idtype="pmpid" link="fulltext">16504159</pubid></pubidlist></xrefbib></bibl><bibl id="B24"><title><p>Gene selection and classification of microarray data using random forest</p></title><aug><au><snm>Diaz-Uriarte</snm><fnm>R</fnm></au><au><snm>de Andres</snm><fnm>SA</fnm></au></aug><source>BMC Bioinformatics</source><pubdate>2006</pubdate><volume>7</volume><fpage>3</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1186/1471-2105-7-3</pubid><pubid idtype="pmcid">1363357</pubid><pubid idtype="pmpid" link="fulltext">16398926</pubid></pubidlist></xrefbib></bibl><bibl id="B25"><title><p>Random forests</p></title><aug><au><snm>Breiman</snm><fnm>L</fnm></au></aug><source>Machine Learning</source><pubdate>2001</pubdate><volume>45</volume><issue>1</issue><fpage>5</fpage><lpage>32</lpage><xrefbib><pubid idtype="doi">10.1023/A:1010933404324</pubid></xrefbib></bibl><bibl id="B26"><title><p>An introduction to variable and feature selection</p></title><aug><au><snm>Guyon</snm><fnm>I</fnm></au><au><snm>Elisseeff</snm><fnm>A</fnm></au></aug><source>Journal of Machine Learning 
Research</source><pubdate>2003</pubdate><volume>3</volume><fpage>1157</fpage><lpage>1182</lpage></bibl><bibl id="B27"><title><p>Feature selection and classification of MAQC-II breast cancer and multiple myeloma microarray gene expression data</p></title><aug><au><snm>Liu</snm><fnm>Q</fnm></au><au><snm>Sung</snm><fnm>AH</fnm></au><au><snm>Chen</snm><fnm>Z</fnm></au><au><snm>Liu</snm><fnm>J</fnm></au><au><snm>Huang</snm><fnm>X</fnm></au><au><snm>Deng</snm><fnm>Y</fnm></au></aug><source>PLoS One</source><pubdate>2009</pubdate><volume>4</volume><issue>12</issue><fpage>e8250</fpage><xrefbib><pubidlist><pubid idtype="doi">10.1371/journal.pone.0008250</pubid><pubid idtype="pmcid">2789385</pubid><pubid idtype="pmpid" link="fulltext">20011240</pubid></pubidlist></xrefbib></bibl><bibl id="B28"><aug><au><snm>Tan</snm><fnm>P</fnm></au><au><snm>Steinbach</snm><fnm>M</fnm></au><au><snm>Kumar</snm><fnm>V</fnm></au></aug><source>Introduction to Data Mining</source><publisher>Addison-Wesley</publisher><pubdate>2005</pubdate><fpage>76</fpage><lpage>79</lpage></bibl><bibl id="B29"><title><p>Systematic benchmarking of microarray data classification: assessing the role of non-linearity and dimensionality reduction</p></title><aug><au><snm>Pochet</snm><fnm>N</fnm></au><au><snm>De Smet</snm><fnm>F</fnm></au><au><snm>Suykens</snm><fnm>J</fnm></au><au><snm>De Moor</snm><fnm>B</fnm></au></aug><source>Bioinformatics</source><pubdate>2004</pubdate><volume>20</volume><issue>17</issue><fpage>3185</fpage><lpage>3195</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1093/bioinformatics/bth383</pubid><pubid idtype="pmpid" link="fulltext">15231531</pubid></pubidlist></xrefbib></bibl><bibl id="B30"><title><p>Classification and regression by random forest</p></title><aug><au><snm>Liaw</snm><fnm>A</fnm></au><au><snm>Wiener</snm><fnm>M</fnm></au></aug><source>R News</source><volume>2</volume><issue>3</issue><fpage>18</fpage><lpage>22</lpage></bibl><bibl id="B31"><title><p>Gene expression correlates of 
clinical prostate cancer behavior</p></title><aug><au><snm>Singh</snm><fnm>D</fnm></au><etal/></aug><source>Cancer Cell</source><pubdate>2002</pubdate><volume>1</volume><issue>2</issue><fpage>227</fpage><lpage>235</lpage></bibl><bibl id="B32"><title><p>Molecular classification of cancer: class discovery and class prediction by gene expression</p></title><aug><au><snm>Golub</snm><fnm>T</fnm></au><etal/></aug><source>Science</source><pubdate>1999</pubdate><volume>286</volume><issue>5439</issue><fpage>531</fpage><lpage>537</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1126/science.286.5439.531</pubid><pubid idtype="pmpid">10521349</pubid></pubidlist></xrefbib></bibl><bibl id="B33"><title><p>Diffuse large B-cell lymphoma outcome prediction by gene expression profiling and supervised machine learning</p></title><aug><au><snm>Shipp</snm><fnm>M</fnm></au><etal/></aug><source>Nat Med</source><pubdate>2002</pubdate><volume>8</volume><issue>1</issue><fpage>68</fpage><lpage>74</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/nm0102-68</pubid><pubid idtype="pmpid" link="fulltext">11786909</pubid></pubidlist></xrefbib></bibl><bibl id="B34"><title><p>Broad patterns of gene expression revealed by clustering analysis of tumor and normal colon tissues probed by oligonucleotide arrays</p></title><aug><au><snm>Alon</snm><fnm>U</fnm></au><etal/></aug><source>Proc Natl Acad Sci USA</source><pubdate>1999</pubdate><volume>96</volume><issue>12</issue><fpage>6745</fpage><lpage>6750</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1073/pnas.96.12.6745</pubid><pubid idtype="pmcid">21986</pubid><pubid idtype="pmpid" link="fulltext">10359783</pubid></pubidlist></xrefbib></bibl><bibl id="B35"><title><p>Prediction of central nervous system embryonal tumor outcome based on gene expression</p></title><aug><au><snm>Pomeroy</snm><fnm>SL</fnm></au><etal/></aug><source>Nature</source><pubdate>2002</pubdate><volume>415</volume><fpage>436</fpage><lpage>442</lpage><xrefbib><pubidlist><pubid 
idtype="doi">10.1038/415436a</pubid><pubid idtype="pmpid" link="fulltext">11807556</pubid></pubidlist></xrefbib></bibl><bibl id="B36"><title><p>Gene expression profiling predicts clinical outcome of breast cancer</p></title><aug><au><snm>Van</snm><fnm>LJ</fnm></au><etal/></aug><source>Nature</source><pubdate>2002</pubdate><volume>415</volume><fpage>530</fpage><lpage>536</lpage><xrefbib><pubidlist><pubid idtype="doi">10.1038/415530a</pubid><pubid idtype="pmpid" link="fulltext">11823860</pubid></pubidlist></xrefbib></bibl><bibl id="B37"><aug><au><snm>Vapnik</snm><fnm>V</fnm></au></aug><source>Statistical Learning Theory</source><publisher>John Wiley</publisher><pubdate>1998</pubdate><note>ISBN-10: 0471030031</note></bibl><bibl id="B38"><aug><au><snm>Heijden</snm><fnm>F</fnm></au><au><snm>Duin</snm><fnm>R</fnm></au><au><snm>Ridder</snm><fnm>D</fnm></au><au><snm>Tax</snm><fnm>D</fnm></au></aug><source>Classification, Parameter Estimation and State Estimation</source><publisher>John Wiley</publisher><pubdate>2004</pubdate><note>ISBN-10: 0470090138</note></bibl></refgrp>
   </bm>
</art>