@article{Cynthia-2022-Feature,
title = "Feature Transformation for Improved Software Bug Detection Models",
author = "Cynthia, Shamse Tasnim and
Roy, Banani and
Mondal, Debajyoti",
journal = "15th Innovations in Software Engineering Conference",
year = "2022",
publisher = "ACM",
url = "https://gwf-uwaterloo.github.io/gwf-publications/G22-9002",
doi = "10.1145/3511430.3511444",
abstract = "Testing software is considered to be one of the most crucial phases in software development life cycle. Software bug fixing requires a significant amount of time and effort. A rich body of recent research explored ways to predict bugs in software artifacts using machine learning based techniques. For a reliable and trustworthy prediction, it is crucial to also consider the explainability aspects of such machine learning models. In this paper, we show how the feature transformation techniques can significantly improve the prediction accuracy and build confidence in building bug prediction models. We propose a novel approach for improved bug prediction that first extracts the features, then finds a weighted transformation of these features using a genetic algorithm that best separates bugs from non-bugs when plotted in a low-dimensional space, and finally, trains the machine learning model using the transformed dataset. In our experiment with real-life bug datasets, the random forest and k-nearest neighbor classifier models that leveraged feature transformation showed 4.25{\%} improvement in recall values on an average of over 8 software systems when compared to the models built on original data.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="Cynthia-2022-Feature">
<titleInfo>
<title>Feature Transformation for Improved Software Bug Detection Models</title>
</titleInfo>
<name type="personal">
<namePart type="given">Shamse</namePart>
<namePart type="given">Tasnim</namePart>
<namePart type="family">Cynthia</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Banani</namePart>
<namePart type="family">Roy</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Debajyoti</namePart>
<namePart type="family">Mondal</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2022</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<genre authority="bibutilsgt">journal article</genre>
<relatedItem type="host">
<titleInfo>
<title>15th Innovations in Software Engineering Conference</title>
</titleInfo>
<originInfo>
<issuance>continuing</issuance>
<publisher>ACM</publisher>
</originInfo>
<genre authority="marcgt">periodical</genre>
<genre authority="bibutilsgt">academic journal</genre>
</relatedItem>
<abstract>Testing software is considered to be one of the most crucial phases in software development life cycle. Software bug fixing requires a significant amount of time and effort. A rich body of recent research explored ways to predict bugs in software artifacts using machine learning based techniques. For a reliable and trustworthy prediction, it is crucial to also consider the explainability aspects of such machine learning models. In this paper, we show how the feature transformation techniques can significantly improve the prediction accuracy and build confidence in building bug prediction models. We propose a novel approach for improved bug prediction that first extracts the features, then finds a weighted transformation of these features using a genetic algorithm that best separates bugs from non-bugs when plotted in a low-dimensional space, and finally, trains the machine learning model using the transformed dataset. In our experiment with real-life bug datasets, the random forest and k-nearest neighbor classifier models that leveraged feature transformation showed 4.25% improvement in recall values on an average of over 8 software systems when compared to the models built on original data.</abstract>
<identifier type="citekey">Cynthia-2022-Feature</identifier>
<identifier type="doi">10.1145/3511430.3511444</identifier>
<location>
<url>https://gwf-uwaterloo.github.io/gwf-publications/G22-9002</url>
</location>
<part>
<date>2022</date>
</part>
</mods>
</modsCollection>
%0 Journal Article
%T Feature Transformation for Improved Software Bug Detection Models
%A Cynthia, Shamse Tasnim
%A Roy, Banani
%A Mondal, Debajyoti
%J 15th Innovations in Software Engineering Conference
%D 2022
%I ACM
%F Cynthia-2022-Feature
%X Testing software is considered to be one of the most crucial phases in software development life cycle. Software bug fixing requires a significant amount of time and effort. A rich body of recent research explored ways to predict bugs in software artifacts using machine learning based techniques. For a reliable and trustworthy prediction, it is crucial to also consider the explainability aspects of such machine learning models. In this paper, we show how the feature transformation techniques can significantly improve the prediction accuracy and build confidence in building bug prediction models. We propose a novel approach for improved bug prediction that first extracts the features, then finds a weighted transformation of these features using a genetic algorithm that best separates bugs from non-bugs when plotted in a low-dimensional space, and finally, trains the machine learning model using the transformed dataset. In our experiment with real-life bug datasets, the random forest and k-nearest neighbor classifier models that leveraged feature transformation showed 4.25% improvement in recall values on an average of over 8 software systems when compared to the models built on original data.
%R 10.1145/3511430.3511444
%U https://gwf-uwaterloo.github.io/gwf-publications/G22-9002
%U https://doi.org/10.1145/3511430.3511444
Markdown (Informal)
[Feature Transformation for Improved Software Bug Detection Models](https://gwf-uwaterloo.github.io/gwf-publications/G22-9002) (Cynthia et al., GWF 2022)
ACL
- Shamse Tasnim Cynthia, Banani Roy, and Debajyoti Mondal. 2022. Feature Transformation for Improved Software Bug Detection Models. 15th Innovations in Software Engineering Conference.