by Hannes Thaller, Lukas Linsbauer, Alexander Egyed
Abstract:
Semantic clones are program components with similar behavior, but different textual representation. Semantic similarity is hard to detect, and semantic clone detection is still an open issue. We present semantic clone detection via Probabilistic Software Modeling (PSM) as a robust method for detecting semantically equivalent methods. PSM inspects the structure and runtime behavior of a program and synthesizes a network of Probabilistic Models (PMs). Each PM in the network represents a method in the program and is capable of generating and evaluating runtime events. We leverage these capabilities to accurately find semantic clones. Results show that the approach can detect semantic clones in the complete absence of syntactic similarity with high precision and low error rates.
Reference:
Towards Semantic Clone Detection via Probabilistic Software Modeling (Hannes Thaller, Lukas Linsbauer, Alexander Egyed), In CoRR, volume abs/2001.07399, 2020.
Bibtex Entry:
@Article{DBLP:journals/corr/abs-2001-07399,
author = {Hannes Thaller and Lukas Linsbauer and Alexander Egyed},
journal = {CoRR},
title = {Towards Semantic Clone Detection via Probabilistic Software Modeling},
year = {2020},
volume = {abs/2001.07399},
abstract = {Semantic clones are program components with similar behavior, but different textual representation. Semantic similarity is hard to detect, and semantic clone detection is still an open issue. We present semantic clone detection via Probabilistic Software Modeling (PSM) as a robust method for detecting semantically equivalent methods. PSM inspects the structure and runtime behavior of a program and synthesizes a network of Probabilistic Models (PMs). Each PM in the network represents a method in the program and is capable of generating and evaluating runtime events. We leverage these capabilities to accurately find semantic clones. Results show that the approach can detect semantic clones in the complete absence of syntactic similarity with high precision and low error rates.},
archiveprefix = {arXiv},
bibsource = {dblp computer science bibliography, https://dblp.org},
biburl = {https://dblp.org/rec/journals/corr/abs-2001-07399.bib},
eprint = {2001.07399},
file = {:Journals/CORR 2020 - Semantic Clone Detectionvia Probabilistic Software Modeling/Semantic Clone Detection via Probabilistic Software Modeling-preprint.pdf:PDF},
keywords = {SCCH},
timestamp = {Fri, 24 Jan 2020 15:00:57 +0100},
url = {https://arxiv.org/abs/2001.07399},
}