{"id":"https://openalex.org/W4415745957","doi":"https://doi.org/10.1109/icsme64153.2025.00035","title":"Are Classical Clone Detectors Good Enough for the AI Era?","display_name":"Are Classical Clone Detectors Good Enough for the AI Era?","publication_year":2025,"publication_date":"2025-09-07","ids":{"openalex":"https://openalex.org/W4415745957","doi":"https://doi.org/10.1109/icsme64153.2025.00035"},"language":null,"primary_location":{"id":"doi:10.1109/icsme64153.2025.00035","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icsme64153.2025.00035","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Software Maintenance and Evolution (ICSME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036373244","display_name":"Ajmain Inqiad Alam","orcid":null},"institutions":[{"id":"https://openalex.org/I32625721","display_name":"University of Saskatchewan","ror":"https://ror.org/010x8gc63","country_code":"CA","type":"education","lineage":["https://openalex.org/I32625721"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Ajmain I. Alam","raw_affiliation_strings":["University of Saskatchewan,Department of Computer Science,Saskatoon,Canada"],"affiliations":[{"raw_affiliation_string":"University of Saskatchewan,Department of Computer Science,Saskatoon,Canada","institution_ids":["https://openalex.org/I32625721"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058812722","display_name":"Palash Ranjan Roy","orcid":"https://orcid.org/0000-0001-9470-4233"},"institutions":[{"id":"https://openalex.org/I32625721","display_name":"University of Saskatchewan","ror":"https://ror.org/010x8gc63","country_code":"CA","type":"education","lineage":["https://openalex.org/I32625721"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Palash R. Roy","raw_affiliation_strings":["University of Saskatchewan,Department of Computer Science,Saskatoon,Canada"],"affiliations":[{"raw_affiliation_string":"University of Saskatchewan,Department of Computer Science,Saskatoon,Canada","institution_ids":["https://openalex.org/I32625721"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025479495","display_name":"Farouq Al-omari","orcid":null},"institutions":[{"id":"https://openalex.org/I160262251","display_name":"Thompson Rivers University","ror":"https://ror.org/01v9wj339","country_code":"CA","type":"education","lineage":["https://openalex.org/I160262251"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Farouq Al-omari","raw_affiliation_strings":["Thompson Rivers University,Department of Engineering,Kamloops,Canada"],"affiliations":[{"raw_affiliation_string":"Thompson Rivers University,Department of Engineering,Kamloops,Canada","institution_ids":["https://openalex.org/I160262251"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102756770","display_name":"Chanchal K. Roy","orcid":"https://orcid.org/0000-0003-0519-6164"},"institutions":[{"id":"https://openalex.org/I32625721","display_name":"University of Saskatchewan","ror":"https://ror.org/010x8gc63","country_code":"CA","type":"education","lineage":["https://openalex.org/I32625721"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Chanchal K. Roy","raw_affiliation_strings":["University of Saskatchewan,Department of Computer Science,Saskatoon,Canada"],"affiliations":[{"raw_affiliation_string":"University of Saskatchewan,Department of Computer Science,Saskatoon,Canada","institution_ids":["https://openalex.org/I32625721"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015470184","display_name":"Banani Roy","orcid":"https://orcid.org/0000-0003-1247-7781"},"institutions":[{"id":"https://openalex.org/I32625721","display_name":"University of Saskatchewan","ror":"https://ror.org/010x8gc63","country_code":"CA","type":"education","lineage":["https://openalex.org/I32625721"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Banani Roy","raw_affiliation_strings":["University of Saskatchewan,Department of Computer Science,Saskatoon,Canada"],"affiliations":[{"raw_affiliation_string":"University of Saskatchewan,Department of Computer Science,Saskatoon,Canada","institution_ids":["https://openalex.org/I32625721"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089178328","display_name":"Kevin A. Schneider","orcid":"https://orcid.org/0000-0003-1113-1754"},"institutions":[{"id":"https://openalex.org/I32625721","display_name":"University of Saskatchewan","ror":"https://ror.org/010x8gc63","country_code":"CA","type":"education","lineage":["https://openalex.org/I32625721"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Kevin A. Schneider","raw_affiliation_strings":["University of Saskatchewan,Department of Computer Science,Saskatoon,Canada"],"affiliations":[{"raw_affiliation_string":"University of Saskatchewan,Department of Computer Science,Saskatoon,Canada","institution_ids":["https://openalex.org/I32625721"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5036373244"],"corresponding_institution_ids":["https://openalex.org/I32625721"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.45079287,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"295","last_page":"307"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9814000129699707,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9814000129699707,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.002199999988079071,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10430","display_name":"Software Engineering Techniques and Practices","score":0.0020000000949949026,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.7542999982833862},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5853999853134155},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.5292999744415283},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5192000269889832},{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.5026000142097473},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.4742000102996826},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.4690999984741211}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7633000016212463},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.7542999982833862},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5853999853134155},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5299000144004822},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.5292999744415283},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5192000269889832},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.5026000142097473},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4936999976634979},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.4742000102996826},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.4690999984741211},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.43299999833106995},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4025999903678894},{"id":"https://openalex.org/C81089528","wikidata":"https://www.wikidata.org/wiki/Q5134986","display_name":"clone (Java method)","level":3,"score":0.35850000381469727},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.32600000500679016},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.3156999945640564},{"id":"https://openalex.org/C152752567","wikidata":"https://www.wikidata.org/wiki/Q116877","display_name":"Code refactoring","level":3,"score":0.3025999963283539},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.29030001163482666},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.2648000121116638},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2614000141620636},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.2572999894618988}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icsme64153.2025.00035","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icsme64153.2025.00035","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Software Maintenance and Evolution (ICSME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":53,"referenced_works":["https://openalex.org/W1512615396","https://openalex.org/W1593203335","https://openalex.org/W1964788505","https://openalex.org/W1967028047","https://openalex.org/W1993673250","https://openalex.org/W1999404243","https://openalex.org/W2003285370","https://openalex.org/W2025962632","https://openalex.org/W2048382152","https://openalex.org/W2065053490","https://openalex.org/W2096491586","https://openalex.org/W2100060170","https://openalex.org/W2101832700","https://openalex.org/W2102543548","https://openalex.org/W2104301886","https://openalex.org/W2120319185","https://openalex.org/W2120326119","https://openalex.org/W2125260159","https://openalex.org/W2128782367","https://openalex.org/W2128888088","https://openalex.org/W2131477050","https://openalex.org/W2151573418","https://openalex.org/W2158439356","https://openalex.org/W2162436321","https://openalex.org/W2165739648","https://openalex.org/W2511803001","https://openalex.org/W2578208870","https://openalex.org/W2621103691","https://openalex.org/W2741705590","https://openalex.org/W2945440850","https://openalex.org/W2955426500","https://openalex.org/W3012514498","https://openalex.org/W3013132080","https://openalex.org/W3014339000","https://openalex.org/W3098605233","https://openalex.org/W3198948396","https://openalex.org/W3208543970","https://openalex.org/W3212083716","https://openalex.org/W4242739280","https://openalex.org/W4312691425","https://openalex.org/W4312803897","https://openalex.org/W4312874104","https://openalex.org/W4319451764","https://openalex.org/W4382793287","https://openalex.org/W4384302844","https://openalex.org/W4385784149","https://openalex.org/W4386142439","https://openalex.org/W4388212271","https://openalex.org/W4388954848","https://openalex.org/W4389544307","https://openalex.org/W4393034946","https://openalex.org/W4394597263","https://openalex.org/W4406495600"],"related_works":[],"abstract_inverted_index":{"The":[0,218],"increasing":[1],"adoption":[2],"of":[3,88,197,224],"AI-generated":[4,23,71,140,160,182],"code":[5,44,72],"has":[6],"reshaped":[7],"modern":[8,247],"software":[9],"development,":[10],"introducing":[11],"syntactic":[12,27,62,76],"and":[13,29,58,65,77,116,130,139,191,204,209,228,238],"semantic":[14,30,67,79],"variations":[15],"in":[16,135,200,245],"cloned":[17],"code.":[18],"Unlike":[19],"traditional":[20,138,170],"human-written":[21],"clones,":[22,80,161,183],"clones":[24],"exhibit":[25,164],"systematic":[26],"patterns":[28],"differences":[31,134],"learned":[32],"from":[33],"largescale":[34],"training":[35],"data.":[36],"This":[37,172],"shift":[38],"presents":[39],"new":[40,94],"challenges":[41],"for":[42],"classical":[43,89,146,178,225,237],"clone":[45,243],"detection":[46,202,244],"(CCD)":[47],"tools,":[48,148],"which":[49],"have":[50],"historically":[51],"been":[52],"validated":[53],"primarily":[54],"on":[55,125],"human-authored":[56,127],"codebases":[57],"optimized":[59],"to":[60,84,132,169,212,241],"detect":[61],"(Type":[63],"1-3)":[64],"limited":[66],"clones.":[68,113,141],"Given":[69],"that":[70,145,234],"can":[73],"produce":[74],"both":[75,236],"complex":[78],"it":[81],"is":[82],"essential":[83],"evaluate":[85,101],"the":[86,195,221,246],"effectiveness":[87,158],"CCD":[90,105,147,179,215,226],"tools":[91,106,180,227],"within":[92],"this":[93,97],"paradigm.":[95],"In":[96],"paper,":[98],"we":[99,120],"systematically":[100],"nine":[102],"widely":[103],"used":[104],"using":[107],"GPTCloneBench,":[108],"a":[109,231],"benchmark":[110],"containing":[111],"GPT-3-generated":[112],"To":[114],"contextualize":[115],"validate":[117],"our":[118],"results,":[119],"further":[121],"test":[122],"these":[123],"detectors":[124],"established":[126],"benchmarks,":[128],"BigCloneBench":[129],"SemanticCloneBench,":[131],"measure":[133],"performance":[136,166],"between":[137],"Our":[142],"analysis":[143],"demonstrates":[144],"particularly":[149],"those":[150],"enhanced":[151],"by":[152,175],"effective":[153],"normalization":[154,198],"techniques,":[155],"retain":[156],"considerable":[157],"against":[159,181],"while":[162],"some":[163],"notable":[165],"variation":[167],"compared":[168],"benchmarks.":[171],"paper":[173],"contributes":[174],"(1)":[176],"evaluating":[177],"providing":[184],"critical":[185],"insights":[186],"into":[187],"their":[188],"current":[189],"strengths":[190],"limitations;":[192],"(2)":[193],"highlighting":[194],"role":[196],"techniques":[199],"improving":[201],"accuracy;":[203],"(3)":[205],"delivering":[206],"detailed":[207],"scalability":[208],"execution-time":[210],"analyses":[211],"support":[213],"practical":[214],"tool":[216],"selection.":[217],"research":[219],"underscores":[220],"continued":[222],"relevance":[223],"suggests":[229],"adopting":[230],"hybrid":[232],"approach":[233],"combines":[235],"AI-based":[239],"methods":[240],"improve":[242],"era.":[248]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-31T00:00:00"}
