% Journal article entry. The citation key must be followed by a comma, and the
% entry closed only after the last field, so that all fields belong to the entry.
@article{ART002102138,
  author  = {Hong, Euyseok and 박미경},
  title   = {Severity-based Software Quality Prediction using Class Imbalanced Data},
  journal = {Journal of The Korea Society of Computer and Information},
  issn    = {1598-849X},
  year    = {2016},
  volume  = {21},
  number  = {4},
  pages   = {73--80},
}
TY - JOUR
AU - Hong, Euyseok
AU - 박미경
TI - Severity-based Software Quality Prediction using Class Imbalanced Data
JO - Journal of The Korea Society of Computer and Information
PY - 2016
VL - 21
IS - 4
PB - The Korean Society Of Computer And Information
SP - 73
EP - 80
SN - 1598-849X
AB - Most fault prediction models have class imbalance problems because training data usually contains many more non-fault class modules than fault class ones. This imbalanced distribution makes it difficult for the models to learn the minor class module data. Data imbalance is much higher when severity-based fault prediction is used. This is because high severity fault modules are a smaller subset of the fault modules. In this paper, we propose severity-based models to solve these problems using the three sampling methods, Resample, SpreadSubSample and SMOTE. Empirical results show that the Resample method has typical over-fit problems, and the SpreadSubSample method cannot enhance the prediction performance of the models. Unlike these two methods, the SMOTE method shows good performance in terms of AUC and FNR values. In particular, the J48 decision tree model using SMOTE outperforms the other prediction models.
KW - Data imbalance
KW - Fault prediction
KW - Severity
KW - Sampling
DO -
UR -
ER -
Hong Euyseok and 박미경. (2016). Severity-based Software Quality Prediction using Class Imbalanced Data. Journal of The Korea Society of Computer and Information, 21(4), 73-80.
Hong Euyseok and 박미경. 2016, "Severity-based Software Quality Prediction using Class Imbalanced Data", Journal of The Korea Society of Computer and Information, vol.21, no.4, pp.73-80.
Hong Euyseok, 박미경 "Severity-based Software Quality Prediction using Class Imbalanced Data" Journal of The Korea Society of Computer and Information 21.4 (2016) : 73-80.
Hong Euyseok, 박미경. Severity-based Software Quality Prediction using Class Imbalanced Data. Journal of The Korea Society of Computer and Information. 2016; 21(4), 73-80.
Hong Euyseok and 박미경. "Severity-based Software Quality Prediction using Class Imbalanced Data" Journal of The Korea Society of Computer and Information 21, no.4 (2016) : 73-80.
Hong Euyseok; 박미경. Severity-based Software Quality Prediction using Class Imbalanced Data. Journal of The Korea Society of Computer and Information, 2016, 21(4), 73-80.
Hong Euyseok; 박미경. Severity-based Software Quality Prediction using Class Imbalanced Data. Journal of The Korea Society of Computer and Information. 2016; 21(4) 73-80.
Hong Euyseok, 박미경. Severity-based Software Quality Prediction using Class Imbalanced Data. Journal of The Korea Society of Computer and Information. 2016; 21(4), 73-80.
Hong Euyseok and 박미경. "Severity-based Software Quality Prediction using Class Imbalanced Data" Journal of The Korea Society of Computer and Information 21, no.4 (2016) : 73-80.