
% Journal article in e-Informatica Software Engineering Journal, vol. 20, no. 1 (2026).
% NOTE(review): `pages` appears to carry the article number (it matches the DOI suffix),
% not a page range -- confirm before converting to a biblatex `eid` field.
@Article{eInformatica2026Art05,
  author   = {Tronicek, Zdenek},
  title    = {Index-Based {Type-3} Clone Detection},
  journal  = {e-Informatica Software Engineering Journal},
  year     = {2026},
  month    = apr,
  volume   = {20},
  number   = {1},
  pages    = {260105},
  doi      = {10.37190/e-Inf260105},
  url      = {https://www.e-informatyka.pl/EISEJ/papers/2026/1/5/},
  keywords = {clone detection, code clones, near-miss clones},
  abstract = {Context: Clone detection is a common task in software engineering. Type-3 clones are fragments of code that can be slightly different in structure. Objective: The article presents a~new algorithm for Type-3 clone detection, its open-source implementation called DrDupLex3, and novel open-source tools that can be used for the automated assessment of Type-3 clones and to prepare training sets for machine learning-based clone detectors. Method: The algorithm for Type-3 clone detection builds upon the index of source code used in DrDupLex, the most accurate Type-2 clone detector to date. Results: A comparison with three state-of-the-art clone detectors (NiCad, CloneWorks, and SourcererCC) shows that DrDupLex3 is able to outperform them in precision, recall, and running time. It reported no false positives and found all clones reported by NiCad, CloneWorks, and SourcererCC. Conclusions: The presented clone detector outperforms three state-of-the-art competitors in a~scenario that can be easily repeated because it is based on tools for automated assessment of Type-3 clones.},
  note     = {Available online: 23 Apr. 2026},
}
