@article{Mondal-2021-ID-correspondence:,
title = "ID-correspondence: a measure for detecting evolutionary coupling",
author = "Mondal, Manishankar and
Roy, Banani and
Roy, Chanchal K. and
Schneider, Kevin A.",
journal = "Empirical Software Engineering",
volume = "26",
number = "1",
year = "2021",
publisher = "Springer Science and Business Media LLC",
url = "https://gwf-uwaterloo.github.io/gwf-publications/G21-23001",
doi = "10.1007/s10664-020-09921-9",
abstract = "Evolutionary coupling is a well investigated phenomenon in software maintenance research and practice. Association rules and two related measures, support and confidence, have been used to identify evolutionary coupling among program entities. However, these measures only emphasize the co-change (i.e., changing together) frequency of entities and cannot determine whether the entities co-evolved by experiencing related changes. Consequently, the approach reports false positives and fails to detect evolutionary coupling among infrequently co-changed entities. We propose a new measure, identifier correspondence (id-correspondence), that quantifies the extent to which changes that occurred to the co-changed entities are related based on identifier similarity. Identifiers are the names given to different program entities such as variables, methods, classes, packages, interfaces, structures, unions etc. We use Dice-S{\o}rensen co-efficient for measuring lexical similarity between the identifiers involved in the changed lines of the co-changed entities. Our investigation on thousands of revisions from nine subject systems covering three programming languages shows that id-correspondence can considerably improve the detection accuracy of evolutionary coupling. It outperforms the existing state-of-the-art evolutionary coupling based techniques with significantly higher recall and F-score in predicting future co-change candidates.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="Mondal-2021-ID-correspondence:">
<titleInfo>
<title>ID-correspondence: a measure for detecting evolutionary coupling</title>
</titleInfo>
<name type="personal">
<namePart type="given">Manishankar</namePart>
<namePart type="family">Mondal</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Banani</namePart>
<namePart type="family">Roy</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Chanchal</namePart>
<namePart type="given">K</namePart>
<namePart type="family">Roy</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Kevin</namePart>
<namePart type="given">A</namePart>
<namePart type="family">Schneider</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2021</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<genre authority="bibutilsgt">journal article</genre>
<relatedItem type="host">
<titleInfo>
<title>Empirical Software Engineering</title>
</titleInfo>
<originInfo>
<issuance>continuing</issuance>
<publisher>Springer Science and Business Media LLC</publisher>
</originInfo>
<genre authority="marcgt">periodical</genre>
<genre authority="bibutilsgt">academic journal</genre>
</relatedItem>
<abstract>Evolutionary coupling is a well investigated phenomenon in software maintenance research and practice. Association rules and two related measures, support and confidence, have been used to identify evolutionary coupling among program entities. However, these measures only emphasize the co-change (i.e., changing together) frequency of entities and cannot determine whether the entities co-evolved by experiencing related changes. Consequently, the approach reports false positives and fails to detect evolutionary coupling among infrequently co-changed entities. We propose a new measure, identifier correspondence (id-correspondence), that quantifies the extent to which changes that occurred to the co-changed entities are related based on identifier similarity. Identifiers are the names given to different program entities such as variables, methods, classes, packages, interfaces, structures, unions etc. We use Dice-Sørensen co-efficient for measuring lexical similarity between the identifiers involved in the changed lines of the co-changed entities. Our investigation on thousands of revisions from nine subject systems covering three programming languages shows that id-correspondence can considerably improve the detection accuracy of evolutionary coupling. It outperforms the existing state-of-the-art evolutionary coupling based techniques with significantly higher recall and F-score in predicting future co-change candidates.</abstract>
<identifier type="citekey">Mondal-2021-ID-correspondence:</identifier>
<identifier type="doi">10.1007/s10664-020-09921-9</identifier>
<location>
<url>https://gwf-uwaterloo.github.io/gwf-publications/G21-23001</url>
</location>
<part>
<date>2021</date>
<detail type="volume"><number>26</number></detail>
<detail type="issue"><number>1</number></detail>
</part>
</mods>
</modsCollection>
%0 Journal Article
%T ID-correspondence: a measure for detecting evolutionary coupling
%A Mondal, Manishankar
%A Roy, Banani
%A Roy, Chanchal K.
%A Schneider, Kevin A.
%J Empirical Software Engineering
%D 2021
%V 26
%N 1
%I Springer Science and Business Media LLC
%F Mondal-2021-ID-correspondence:
%X Evolutionary coupling is a well investigated phenomenon in software maintenance research and practice. Association rules and two related measures, support and confidence, have been used to identify evolutionary coupling among program entities. However, these measures only emphasize the co-change (i.e., changing together) frequency of entities and cannot determine whether the entities co-evolved by experiencing related changes. Consequently, the approach reports false positives and fails to detect evolutionary coupling among infrequently co-changed entities. We propose a new measure, identifier correspondence (id-correspondence), that quantifies the extent to which changes that occurred to the co-changed entities are related based on identifier similarity. Identifiers are the names given to different program entities such as variables, methods, classes, packages, interfaces, structures, unions etc. We use Dice-Sørensen co-efficient for measuring lexical similarity between the identifiers involved in the changed lines of the co-changed entities. Our investigation on thousands of revisions from nine subject systems covering three programming languages shows that id-correspondence can considerably improve the detection accuracy of evolutionary coupling. It outperforms the existing state-of-the-art evolutionary coupling based techniques with significantly higher recall and F-score in predicting future co-change candidates.
%R 10.1007/s10664-020-09921-9
%U https://gwf-uwaterloo.github.io/gwf-publications/G21-23001
%U https://doi.org/10.1007/s10664-020-09921-9
Markdown (Informal)
[ID-correspondence: a measure for detecting evolutionary coupling](https://gwf-uwaterloo.github.io/gwf-publications/G21-23001) (Mondal et al., GWF 2021)
ACL
- Manishankar Mondal, Banani Roy, Chanchal K. Roy, and Kevin A. Schneider. 2021. ID-correspondence: a measure for detecting evolutionary coupling. Empirical Software Engineering, 26(1).