% Conference paper (ISSRE 2016): empirical comparison of feature selection
% methods for software defect prediction. Exported from a research portal;
% the conference name, conference dates and copyright line that the export
% had packed into one printed note are stored in dedicated fields below
% (eventtitle, eventdate, copyright), which classic BibTeX styles ignore.
@inproceedings{cc1fbd80898543c1845dd764ad9d3813,
  author     = {Xu, Zhou and Liu, Jin and Yang, Zijiang and An, Gege and Jia, Xiangyang},
  title      = {The Impact of Feature Selection on Defect Prediction Performance: An Empirical Comparison},
  booktitle  = {Proceedings - 2016 {IEEE} 27th International Symposium on Software Reliability Engineering, {ISSRE} 2016},
  series     = {Proceedings - International Symposium on Software Reliability Engineering, {ISSRE}},
  publisher  = {IEEE Computer Society},
  pages      = {309--320},
  year       = {2016},
  month      = dec,
  day        = {5},
  doi        = {10.1109/ISSRE.2016.13},
  language   = {english},
  eventtitle = {27th {IEEE} International Symposium on Software Reliability Engineering, {ISSRE} 2016},
  eventdate  = {2016-10-23/2016-10-27},
  copyright  = {{\textcopyright} 2016 IEEE},
  keywords   = {defect prediction, feature selection, Scott-Knott test},
  abstract   = {Software defect prediction aims to determine whether a software module is defect-prone by constructing prediction models. The performance of such models is susceptible to the high dimensionality of the datasets that may include irrelevant and redundant features. Feature selection is applied to alleviate this issue. Because many feature selection methods have been proposed, there is an imperative need to analyze and compare these methods. Prior empirical studies may have potential controversies and limitations, such as the contradictory results, usage of private datasets and inappropriate statistical test techniques. This observation leads us to conduct a careful empirical study to reinforce the confidence of the experimental conclusions by considering several potential source of bias, such as the noise in the dataset and the dataset types. In this paper, we investigate the impact of 32 feature selection methods on the defect prediction performance over two versions of the NASA dataset (i.e., the noisy and clean NASA datasets) and one open source AEEEM dataset. We use a state-of-the-art double Scott-Knott test technique to analyze these methods. Experimental results show that the effectiveness of these feature selection methods on defect prediction performance varies significantly over all the datasets.},
}