{"id":"https://openalex.org/W4415034616","doi":"https://doi.org/10.1109/scam67354.2025.00021","title":"Challenging Bug Prediction and Repair Models with Synthetic Bugs","display_name":"Challenging Bug Prediction and Repair Models with Synthetic Bugs","publication_year":2025,"publication_date":"2025-09-08","ids":{"openalex":"https://openalex.org/W4415034616","doi":"https://doi.org/10.1109/scam67354.2025.00021"},"language":"en","primary_location":{"id":"doi:10.1109/scam67354.2025.00021","is_oa":false,"landing_page_url":"https://doi.org/10.1109/scam67354.2025.00021","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Source Code Analysis &amp;amp; Manipulation (SCAM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028705274","display_name":"Ali Reza Ibrahimzada","orcid":"https://orcid.org/0000-0002-3797-818X"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ali Reza Ibrahimzada","raw_affiliation_strings":["University of Illinois Urbana-Champaign,Urbana,IL,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana-Champaign,Urbana,IL,USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019580960","display_name":"Yang Chen","orcid":"https://orcid.org/0009-0008-1409-4163"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yang Chen","raw_affiliation_strings":["University of Illinois Urbana-Champaign,Urbana,IL,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana-Champaign,Urbana,IL,USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108306647","display_name":"Ryan Rong","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ryan Rong","raw_affiliation_strings":["Stanford University,Stanford,CA,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stanford University,Stanford,CA,USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058824250","display_name":"Reyhaneh Jabbarvand","orcid":"https://orcid.org/0000-0002-0668-8526"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Reyhaneh Jabbarvand","raw_affiliation_strings":["University of Illinois Urbana-Champaign,Urbana,IL,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana-Champaign,Urbana,IL,USA","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.3589,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.91642554,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"133","last_page":"144"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9247999787330627,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9247999787330627,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11750","display_name":"Phytoplasmas and Hemiptera pathogens","score":0.9014999866485596,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/software-bug","display_name":"Software bug","score":0.6403999924659729},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5936999917030334},{"id":"https://openalex.org/keywords/software-regression","display_name":"Software regression","score":0.555400013923645},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5177000164985657},{"id":"https://openalex.org/keywords/complement","display_name":"Complement (music)","score":0.5131999850273132},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.460999995470047},{"id":"https://openalex.org/keywords/security-bug","display_name":"Security bug","score":0.4219000041484833},{"id":"https://openalex.org/keywords/software-inspection","display_name":"Software inspection","score":0.4171999990940094},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4097999930381775},{"id":"https://openalex.org/keywords/code-refactoring","display_name":"Code refactoring","score":0.4047999978065491}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7135999798774719},{"id":"https://openalex.org/C1009929","wikidata":"https://www.wikidata.org/wiki/Q179550","display_name":"Software bug","level":3,"score":0.6403999924659729},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5936999917030334},{"id":"https://openalex.org/C191727507","wikidata":"https://www.wikidata.org/wiki/Q24346","display_name":"Software regression","level":5,"score":0.555400013923645},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5177000164985657},{"id":"https://openalex.org/C112313634","wikidata":"https://www.wikidata.org/wiki/Q7886648","display_name":"Complement (music)","level":5,"score":0.5131999850273132},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.460999995470047},{"id":"https://openalex.org/C131275738","wikidata":"https://www.wikidata.org/wiki/Q7445023","display_name":"Security bug","level":5,"score":0.4219000041484833},{"id":"https://openalex.org/C10272871","wikidata":"https://www.wikidata.org/wiki/Q929972","display_name":"Software inspection","level":5,"score":0.4171999990940094},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4097999930381775},{"id":"https://openalex.org/C152752567","wikidata":"https://www.wikidata.org/wiki/Q116877","display_name":"Code refactoring","level":3,"score":0.4047999978065491},{"id":"https://openalex.org/C136643341","wikidata":"https://www.wikidata.org/wiki/Q1361526","display_name":"Reachability","level":2,"score":0.3817000091075897},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.3617999851703644},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.3529999852180481},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34279999136924744},{"id":"https://openalex.org/C128942645","wikidata":"https://www.wikidata.org/wiki/Q1568346","display_name":"Test case","level":3,"score":0.3310000002384186},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.328900009393692},{"id":"https://openalex.org/C53942775","wikidata":"https://www.wikidata.org/wiki/Q1211721","display_name":"Code coverage","level":3,"score":0.3228999972343445},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3158000111579895},{"id":"https://openalex.org/C168065819","wikidata":"https://www.wikidata.org/wiki/Q845566","display_name":"Debugging","level":2,"score":0.3100000023841858},{"id":"https://openalex.org/C101317890","wikidata":"https://www.wikidata.org/wiki/Q940053","display_name":"Software maintenance","level":4,"score":0.3050000071525574},{"id":"https://openalex.org/C137287247","wikidata":"https://www.wikidata.org/wiki/Q1329550","display_name":"Static program analysis","level":4,"score":0.30090001225471497},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.29269999265670776},{"id":"https://openalex.org/C199519371","wikidata":"https://www.wikidata.org/wiki/Q942695","display_name":"Source lines of code","level":3,"score":0.28700000047683716},{"id":"https://openalex.org/C149091818","wikidata":"https://www.wikidata.org/wiki/Q2429814","display_name":"Software system","level":3,"score":0.27140000462532043},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.2709999978542328},{"id":"https://openalex.org/C2779639559","wikidata":"https://www.wikidata.org/wiki/Q7661178","display_name":"Symbolic execution","level":3,"score":0.2648000121116638},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.2630999982357025},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.2574000060558319},{"id":"https://openalex.org/C150292731","wikidata":"https://www.wikidata.org/wiki/Q1342704","display_name":"Code review","level":5,"score":0.2531999945640564},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.25099998712539673}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/scam67354.2025.00021","is_oa":false,"landing_page_url":"https://doi.org/10.1109/scam67354.2025.00021","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Source Code Analysis &amp;amp; Manipulation (SCAM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1655956671","https://openalex.org/W1963523113","https://openalex.org/W2014011458","https://openalex.org/W2156723666","https://openalex.org/W2170260129","https://openalex.org/W2466388701","https://openalex.org/W2587741066","https://openalex.org/W2739564891","https://openalex.org/W2795260929","https://openalex.org/W2956069715","https://openalex.org/W2993007949","https://openalex.org/W3011190810","https://openalex.org/W3091588759","https://openalex.org/W3098605233","https://openalex.org/W3160691259","https://openalex.org/W3183469243","https://openalex.org/W3195156628","https://openalex.org/W3198685994","https://openalex.org/W4281763794","https://openalex.org/W4285490453","https://openalex.org/W4308643033","https://openalex.org/W4308731473","https://openalex.org/W4313563424","https://openalex.org/W4384154386","https://openalex.org/W4384345705","https://openalex.org/W4385245566","https://openalex.org/W4388483599","https://openalex.org/W4394769102","https://openalex.org/W4402457499","https://openalex.org/W4411450037"],"related_works":[],"abstract_inverted_index":{"Bugs":[0],"are":[1,36,98,181,265],"essential":[2],"in":[3,9,22,64,124,140,221,261],"software":[4,23,51],"engineering;":[5],"many":[6],"research":[7],"studies":[8],"the":[10,49,61,77,125,137,141,158,164,170,176,232,237],"past":[11],"decades":[12],"have":[13,131],"been":[14],"proposed":[15],"to":[16,38,44,70,109,136,144,150,184,190,193,198,208,229,267,275,296,309,326],"detect,":[17],"localize,":[18],"and":[19,42,72,86,95,182,203,215,254,281,285,291,294,311,315],"repair":[20,45,204,297,302,305],"bugs":[21,192,246,263],"systems.":[24],"Effectiveness":[25],"evaluation":[26,243],"of":[27,54,117,244,313],"such":[28],"techniques":[29,189],"requires":[30],"complex":[31],"bugs,":[32,75,97],"i.e.,":[33,92,321],"those":[34],"that":[35,264],"hard":[37,43,69,266,295],"detect":[39,268],"through":[40,46],"testing":[41],"debugging.":[47],"From":[48],"classic":[50],"engineering":[52],"point":[53],"view,":[55],"a":[56,101,114,132,146,162,166,328],"hard-to-repair":[57,96,154,216],"bug":[58,102,129,147,155,167,196,201,271],"differs":[59,168],"from":[60,169,247],"correct":[62,138],"code":[63,134,139,172,211,220,329],"multiple":[65,107,174,213,222],"locations,":[66],"making":[67],"it":[68,322],"localize":[71],"repair.":[73],"Hard-to-detect":[74],"on":[76],"other":[78],"hand,":[79],"manifest":[80],"themselves":[81],"under":[82,113],"specific":[83,115],"test":[84],"inputs":[85],"reachability":[87],"conditions.":[88],"These":[89],"two":[90,121,255],"objectives,":[91],"generating":[93,262],"hard-to-detect":[94,214],"mostly":[99],"aligned;":[100],"generation":[103],"technique":[104,303],"can":[105],"change":[106,231],"statements":[108],"be":[110],"covered":[111],"only":[112,230],"set":[116],"inputs.":[118],"However,":[119],"these":[120],"objectives":[122],"conflict":[123],"learning-based":[126,200,270,300],"techniques:":[127],"A":[128],"should":[130],"similar":[133],"representation":[135],"training":[142,332],"data":[143],"challenge":[145,199],"prediction":[148,202,272],"model":[149,239],"distinguish":[151],"them.":[152],"The":[153],"definition":[156],"remains":[157],"same":[159],"but":[160,225],"with":[161,330],"caveat:":[163],"more":[165,177],"original":[171],"(at":[173],"locations),":[175],"distant":[178],"their":[179],"representations":[180],"easier":[183],"detect.":[185],"This":[186],"demands":[187],"new":[188],"generate":[191],"complement":[194],"existing":[195],"datasets":[197],"techniques.(p)(/p)We":[205],"propose":[206],"BugFarm":[207,218,253,318],"transform":[209],"arbitrary":[210],"into":[212],"bugs.":[217],"mutates":[219],"locations":[223,235],"(hard-to-repair)":[224],"leverages":[226],"attention":[227],"analysis":[228],"least":[233],"attended":[234],"by":[236,252,269,298],"underlying":[238],"(hard-to-detect).":[240],"Our":[241],"comprehensive":[242],"435k+":[245],"over":[248],"1.9M":[249],"mutants":[250],"generated":[251],"alternative":[256],"approaches":[257,273],"demonstrates":[258],"our":[259],"superiority":[260],"(up":[274],"40.53%":[276],"higher":[277],"False":[278],"Negative":[279],"Rate":[280],"10.76%,":[282],"5.2%,":[283],"28.93%,":[284],"20.53%":[286],"lower":[287],"Accuracy,":[288],"Precision,":[289],"Recall,":[290],"F1":[292],"score)":[293],"state-of-the-art":[299],"program":[301],"(28%":[304],"success":[306],"rate":[307],"compared":[308],"36%":[310],"49%":[312],"LEAM":[314],"\u03bcBERT":[316],"bugs).":[317],"is":[319],"efficient,":[320],"takes":[323],"nine":[324],"seconds":[325],"mutate":[327],"no":[331],"overhead.":[333]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
