@article{26472971fc2345b4925fdc52c1cdd78b,
title = "GD-RDA: A New Regularized Discriminant Analysis for High-Dimensional Data",
abstract = "High-throughput techniques bring novel tools and also statistical challenges to genomic research. Identification of which type of diseases a new patient belongs to has been recognized as an important problem. For high-dimensional small sample size data, the classical discriminant methods suffer from the singularity problem and are, therefore, no longer applicable in practice. In this article, we propose a geometric diagonalization method for the regularized discriminant analysis. We then consider a bias correction to further improve the proposed method. Simulation studies show that the proposed method performs better than, or at least as well as, the existing methods in a wide range of settings. A microarray dataset and an RNA-seq dataset are also analyzed and they demonstrate the superiority of the proposed method over the existing competitors, especially when the number of samples is small or the number of genes is large. Finally, we have developed an R package called {"}GDRDA{"} which is available upon request.",
keywords = "bias correction, classification, diagonalization, discriminant, geometric, microarray, RNA-seq",
author = "Yan Zhou and Baoxue Zhang and Gaorong Li and Tiejun Tong and Xiang Wan",
note = "Funding Information: The authors thank the editor, the associate editor, and the referees for their constructive comments that led to a substantial improvement of the paper. Xiang Wan{\textquoteright}s research was supported by Hong Kong RGC grant HKBU12202114 and the National Natural Science Foundation of China (Grant No. 61501389). Tiejun Tong{\textquoteright}s research was supported by the Hong Kong Baptist University grants FRG1/14-15/084, FRG2/15-16/019 and FRG2/15-16/038, and the National Natural Science Foundation of China (Grant No. 11671338). Yan Zhou{\textquoteright}s research was supported by Tianyuan fund for Mathematics (Grant No. 11526143), Doctor start fund of Guangdong Province [No. 2016A030310062 (85118-000043)], and The Natural Science Foundation of SZU (Grant No. 836-00008303). Gaorong Li{\textquoteright}s research was supported by the National Natural Science Foundation of China (Grant No. 11471029), the Beijing Natural Science Foundation (Grant No. 1142002), and the Science and Technology Project of Beijing Municipal Education Commission (Grant No. KM201410005010). Baoxue Zhang{\textquoteright}s research was supported by the National Science Foundation of China (Grant No. 11671268). The {\textquoteleft}{\textquoteleft}GDRDA{\textquoteright}{\textquoteright} package is made in the form of an R code, and the complete documentation is available on request from the corresponding author.",
year = "2017",
month = nov,
doi = "10.1089/cmb.2017.0029",
language = "English",
volume = "24",
pages = "1099--1111",
journal = "Journal of Computational Biology",
issn = "1066-5277",
publisher = "Mary Ann Liebert Inc.",
number = "11",
}