@article{8398e98efe7b4bd1bdc5f4a57bd66121,
title = "Hybrid clustering solution selection strategy",
abstract = "Cluster ensemble approaches make use of a set of clustering solutions which are derived from different data sources to gain a more comprehensive and significant clustering result over conventional single clustering approaches. Unfortunately, not all the clustering solutions in the ensemble contribute to the final result. In this paper, we focus on the clustering solution selection strategy in the cluster ensemble, and propose to view clustering solutions as features such that suitable feature selection techniques can be used to perform clustering solution selection. Furthermore, a hybrid clustering solution selection strategy (HCSS) is designed based on a proposed weighting function, which combines several feature selection techniques for the refinement of clustering solutions in the ensemble. Finally, a new measure is designed to evaluate the effectiveness of clustering solution selection strategies. The experimental results on both UCI machine learning datasets and cancer gene expression profiles demonstrate that HCSS works well on most of the datasets, obtains more desirable final results, and outperforms most of the state-of-the-art clustering solution selection strategies.",
keywords = "Cluster ensemble, Clustering solution selection, Feature selection, Hybrid strategy",
author = "Zhiwen Yu and Le Li and Yunjun Gao and Jane You and Jiming LIU and Wong, {Hau San} and Guoqiang Han",
note = "Funding Information: The authors are grateful for the constructive advice on the revision of the manuscript from the anonymous reviewers. The work described in this paper was partially funded by the grant from the Hong Kong Scholars Program (Project no. XJ2012015 ) and the outstanding talent training plan of South China University of Technology, and supported by grants from the National Natural Science Foundation of China (NSFC) (Project nos. 61003174 , 61070090 , 61273363 , and 61379033 ), the NSFC-Guangdong Joint Fund (Project nos. U1035004 ), the New Century Excellent Talents in University (Project no. NCET-11-0165 ), the Guangdong Natural Science Funds for Distinguished Young Scholar (Project no. S2013050014677 ), a grant from Science and Technology Planning Project of Guangzhou (Project no. 11A11080267 ), a grant from China Postdoctoral Science Foundation (Project no. 2013M540655 ), a grant from Foundation of Guangdong Educational Committee (Project no. 2012KJCX0011 ), a grant from the Fundamental Research Funds for the Central Universities (Project no. 2014G0007 ), a grant from Key Enterprises and Innovation Organizations in Nanshan District in Shenzhen (Project no. KC2013ZDZJ0007A ), a grant from Natural Science Foundation of Guangdong Province, China (Project no. S2012010009961 ), a grant from the Doctoral Program of Higher Education (Project no. 20110172120027 ), a grant from the Cooperation Project in Industry, Education and Academy of Guangdong Province and Ministry of Education of China (Project no. 2011B090400032 ), a grant from the key lab of cloud computing and big data in Guangzhou (Project no. SITGZ[2013]268-6 ), a grant from the City University of Hong Kong (Project no. 7004047 ), the grants from the Hong Kong Polytechnic University ( G-YK77 and G-YK53 ) and a grant from the Hong Kong Baptist University (Project no. RGC/HKBU211212). Funding Information: Zhiwen Yu is a professor in the School of Computer Science and Engineering, South China University of Technology, Guangzhou, China. He is a senior member of IEEE, a senior member of China Computer Federation (CCF), a member of Artificial Intelligence and Pattern Recognition Committee, and Multimedia Technology Committee in CCF. He is also a ACM member. Dr. Yu obtained the Ph.D. degree from City University of Hong Kong in 2008. He is supported by the program for New Century Excellent Talents in University in 2011, the program for Hong Kong Scholar in 2012 (Cooperation supervisor: IEEE Fellow, Prof. Jiming Liu) and the Guangdong natural science funds for distinguished young scholar in 2013. The research areas of Dr. Yu focus on data mining, machine learning, bioinformatics and pattern recognition. Until now, Dr. Yu has been published more than 80 referred journal papers and international conference papers, including TEC, TMM, TSMC-B, TCVST, TCBB, TNB, PR, IS, Bioinformatics, and so on. ",
year = "2014",
month = oct,
doi = "10.1016/j.patcog.2014.04.005",
language = "English",
volume = "47",
pages = "3362--3375",
journal = "Pattern Recognition",
issn = "0031-3203",
publisher = "Elsevier Ltd.",
number = "10",
}