@inproceedings{508c5fb9b3074e54b36ba0c6ec4f9cf8,
title = "An Empirical Investigation to Overcome Class-Imbalance in Inspection Reviews",
abstract = "Background: software inspection results in reviews that report the presence of faults. Requirements author must manually read through the reviews and differentiate between true-faults and false-positives. Problem: post-inspection decisions (fault or nonfault) are difficult and time consuming. It is difficult to employ machine learning (ML) techniques directly to raw (unstructured) data because of class imbalance problem and possible fault-slippage through misclassification of fault. Aim: The aim of this research is to solve this problem with the help of ensemble approach and priority analysis to achieve significant accuracy in determining true-fault and false-positive reviews without losing any listed fault. Method: We conducted empirical experiment using two trained models (with reviews from inspection domain vs. movies domain) to address class imbalance problem. Our approach uses ensemble methods to develop classification confidence of inspection reviews and assigns them to appropriate priority class. Results: The results showed that movies trained model performed better than inspection trained and restricted any possible fault-slippage.",
keywords = "class imbalance, ensemble, Fault priority, fault slippage, inspections reviews, machine learning, part of speech, sampling",
author = "Maninder Singh and Walia, {Gursimran S.} and Anurag Goswami",
note = "Publisher Copyright: {\textcopyright} 2017 IEEE.; 2017 International Conference on Machine Learning and Data Science, MLDS 2017 ; Conference date: 14-12-2017 Through 15-12-2017",
year = "2018",
month = mar,
day = "19",
doi = "10.1109/MLDS.2017.15",
language = "English (US)",
series = "Proceedings - 2017 International Conference on Machine Learning and Data Science, MLDS 2017",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "15--22",
booktitle = "Proceedings - 2017 International Conference on Machine Learning and Data Science, MLDS 2017",
}