{"id":"https://openalex.org/W7125910738","doi":"https://doi.org/10.1109/smc58881.2025.11342537","title":"Semantic SZZ: Mitigating the Impact of Misclassified Corrective Changes in Just-in-Time Software Defect Prediction","display_name":"Semantic SZZ: Mitigating the Impact of Misclassified Corrective Changes in Just-in-Time Software Defect Prediction","publication_year":2025,"publication_date":"2025-10-05","ids":{"openalex":"https://openalex.org/W7125910738","doi":"https://doi.org/10.1109/smc58881.2025.11342537"},"language":null,"primary_location":{"id":"doi:10.1109/smc58881.2025.11342537","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11342537","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5082285551","display_name":"Ronaldo C. Veras","orcid":null},"institutions":[{"id":"https://openalex.org/I25112270","display_name":"Universidade Federal de Pernambuco","ror":"https://ror.org/047908t24","country_code":"BR","type":"education","lineage":["https://openalex.org/I25112270"]}],"countries":["BR"],"is_corresponding":true,"raw_author_name":"Ronaldo C. Veras","raw_affiliation_strings":["Federal University of Pernambuco,Center for Informatics,Recife,Brazil"],"affiliations":[{"raw_affiliation_string":"Federal University of Pernambuco,Center for Informatics,Recife,Brazil","institution_ids":["https://openalex.org/I25112270"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070984576","display_name":"George G. Cabral","orcid":"https://orcid.org/0000-0003-2831-4274"},"institutions":[{"id":"https://openalex.org/I62921916","display_name":"Universidade Federal Rural de Pernambuco","ror":"https://ror.org/02ksmb993","country_code":"BR","type":"education","lineage":["https://openalex.org/I62921916"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"George G. Cabral","raw_affiliation_strings":["Federal Rural University of Pernambuco,Department of Computing,Recife,Brazil"],"affiliations":[{"raw_affiliation_string":"Federal Rural University of Pernambuco,Department of Computing,Recife,Brazil","institution_ids":["https://openalex.org/I62921916"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035927976","display_name":"A. T. C. Oliveira","orcid":null},"institutions":[{"id":"https://openalex.org/I25112270","display_name":"Universidade Federal de Pernambuco","ror":"https://ror.org/047908t24","country_code":"BR","type":"education","lineage":["https://openalex.org/I25112270"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Adriano L. I. Oliveira","raw_affiliation_strings":["Federal University of Pernambuco,Center for Informatics,Recife,Brazil"],"affiliations":[{"raw_affiliation_string":"Federal University of Pernambuco,Center for Informatics,Recife,Brazil","institution_ids":["https://openalex.org/I25112270"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5082285551"],"corresponding_institution_ids":["https://openalex.org/I25112270"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.84927961,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"769","last_page":"774"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9882000088691711,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9882000088691711,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.003700000001117587,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10430","display_name":"Software Engineering Techniques and Practices","score":0.00139999995008111,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/commit","display_name":"Commit","score":0.8866999745368958},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.6758000254631042},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.5892999768257141},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4959000051021576},{"id":"https://openalex.org/keywords/software-bug","display_name":"Software bug","score":0.41029998660087585},{"id":"https://openalex.org/keywords/software-development","display_name":"Software development","score":0.3986000120639801}],"concepts":[{"id":"https://openalex.org/C153180980","wikidata":"https://www.wikidata.org/wiki/Q19776675","display_name":"Commit","level":2,"score":0.8866999745368958},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.6758000254631042},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6714000105857849},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.5892999768257141},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4959000051021576},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4652999937534332},{"id":"https://openalex.org/C1009929","wikidata":"https://www.wikidata.org/wiki/Q179550","display_name":"Software bug","level":3,"score":0.41029998660087585},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.3986000120639801},{"id":"https://openalex.org/C117447612","wikidata":"https://www.wikidata.org/wiki/Q1412670","display_name":"Software quality","level":4,"score":0.3497999906539917},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34299999475479126},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3188000023365021},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.3151000142097473},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.30070000886917114},{"id":"https://openalex.org/C149091818","wikidata":"https://www.wikidata.org/wiki/Q2429814","display_name":"Software system","level":3,"score":0.3003000020980835},{"id":"https://openalex.org/C101317890","wikidata":"https://www.wikidata.org/wiki/Q940053","display_name":"Software maintenance","level":4,"score":0.2784999907016754},{"id":"https://openalex.org/C82214349","wikidata":"https://www.wikidata.org/wiki/Q657339","display_name":"Software metric","level":5,"score":0.2705000042915344},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2680000066757202},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2646999955177307},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2587999999523163}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/smc58881.2025.11342537","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11342537","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.6729430556297302}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W2068714596","https://openalex.org/W2082183626","https://openalex.org/W2147386665","https://openalex.org/W2276400542","https://openalex.org/W2729440153","https://openalex.org/W2796283679","https://openalex.org/W2955232136","https://openalex.org/W2997546679","https://openalex.org/W3134816784","https://openalex.org/W3162494388","https://openalex.org/W3213259750","https://openalex.org/W4285229502","https://openalex.org/W4400959040"],"related_works":[],"abstract_inverted_index":{"In":[0],"the":[1,25,63,68,73,99,109,112,124,139,144],"evolving":[2],"landscape":[3],"of":[4,9,43,67,90,101,114,129,138],"software":[5,16],"engineering,":[6],"accurate":[7],"identification":[8,54],"defect-inducing":[10,115],"commits":[11,35,53,91,102,116],"is":[12,31],"critical":[13],"to":[14,40,76,98,123,150],"improving":[15],"quality":[17],"and":[18],"reducing":[19],"development":[20],"costs.":[21],"This":[22],"paper":[23],"revisits":[24],"widely":[26],"adopted":[27],"SZZ":[28,74,141],"algorithm,":[29],"which":[30],"utilized":[32],"for":[33,84,108],"labeling":[34,142],"as":[36,94,103,135],"clean":[37],"or":[38],"defect-inducing,":[39],"address":[41],"one":[42],"its":[44,48],"main":[45],"limitations,":[46],"i.e.,":[47],"reliance":[49],"on":[50],"outdated":[51],"corrective":[52],"strategies.":[55],"We":[56],"propose":[57],"an":[58,106],"innovative":[59],"approach":[60],"that":[61],"integrates":[62],"semantic":[64],"understanding":[65],"capability":[66],"GPT":[69],"OpenAI":[70],"model":[71],"into":[72],"flow":[75],"better":[77],"interpret":[78],"commit":[79],"messages.":[80],"Our":[81],"experiments":[82,131],"reveal,":[83],"some":[85],"projects,":[86],"a":[87,136],"large":[88],"number":[89,113],"incorrectly":[92],"interpreted":[93],"defect-fixing,":[95],"consequently,":[96],"leading":[97],"misclassification":[100],"defect-inducing.":[104],"As":[105],"example,":[107],"Postgresql":[110],"dataset,":[111],"was":[117],"reduced":[118],"in":[119],"21%":[120],"when":[121],"compared":[122],"original":[125],"SZZ.":[126],"Furthermore,":[127],"results":[128],"our":[130],"strongly":[132],"suggest":[133],"that,":[134],"result":[137],"proposed":[140],"process,":[143],"JIT-SDP":[145],"problem":[146],"has":[147],"been":[148],"shown":[149],"be":[151],"more":[152],"challenging":[153],"than":[154],"originally":[155],"reported":[156],"by":[157],"previous":[158],"works.":[159]},"counts_by_year":[],"updated_date":"2026-01-29T23:17:01.242718","created_date":"2026-01-29T00:00:00"}
