{"id":"https://openalex.org/W7125956055","doi":"https://doi.org/10.1109/ase63991.2025.00038","title":"Automated Repair of Ambiguous Problem Descriptions for LLM-Based Code Generation","display_name":"Automated Repair of Ambiguous Problem Descriptions for LLM-Based Code Generation","publication_year":2025,"publication_date":"2025-11-16","ids":{"openalex":"https://openalex.org/W7125956055","doi":"https://doi.org/10.1109/ase63991.2025.00038"},"language":null,"primary_location":{"id":"doi:10.1109/ase63991.2025.00038","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ase63991.2025.00038","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 40th IEEE/ACM International Conference on Automated Software Engineering (ASE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122907431","display_name":"Haoxiang Jia","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Haoxiang Jia","raw_affiliation_strings":["Peking University,Key Laboratory of HCST (PKU), MoE, SCS,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University,Key Laboratory of HCST (PKU), MoE, SCS,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040391038","display_name":"Robbie Morris","orcid":null},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Robbie Morris","raw_affiliation_strings":["University College London,United Kingdom"],"affiliations":[{"raw_affiliation_string":"University College London,United Kingdom","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101610258","display_name":"He Ye","orcid":"https://orcid.org/0000-0003-4807-2110"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"He Ye","raw_affiliation_strings":["University College London,United Kingdom"],"affiliations":[{"raw_affiliation_string":"University College London,United Kingdom","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012165852","display_name":"Federica Sarro","orcid":"https://orcid.org/0000-0002-9146-442X"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Federica Sarro","raw_affiliation_strings":["University College London,United Kingdom"],"affiliations":[{"raw_affiliation_string":"University College London,United Kingdom","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011184280","display_name":"Sergey Mechtaev","orcid":"https://orcid.org/0000-0001-6088-4993"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sergey Mechtaev","raw_affiliation_strings":["Peking University,Key Laboratory of HCST (PKU), MoE, SCS,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University,Key Laboratory of HCST (PKU), MoE, SCS,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5122907431"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.85340949,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"367","last_page":"379"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.7301999926567078,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.7301999926567078,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.11580000072717667,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11450","display_name":"Model-Driven Software Engineering Techniques","score":0.024399999529123306,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.8399999737739563},{"id":"https://openalex.org/keywords/interpretation","display_name":"Interpretation (philosophy)","score":0.5734999775886536},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5411999821662903},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5253999829292297},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.519599974155426},{"id":"https://openalex.org/keywords/natural-language-generation","display_name":"Natural language generation","score":0.4984999895095825},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.48030000925064087}],"concepts":[{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.8399999737739563},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7056000232696533},{"id":"https://openalex.org/C527412718","wikidata":"https://www.wikidata.org/wiki/Q855395","display_name":"Interpretation (philosophy)","level":2,"score":0.5734999775886536},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5411999821662903},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5253999829292297},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.519599974155426},{"id":"https://openalex.org/C2776187449","wikidata":"https://www.wikidata.org/wiki/Q1513879","display_name":"Natural language generation","level":3,"score":0.4984999895095825},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.48030000925064087},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.426800012588501},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.4250999987125397},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.41819998621940613},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38989999890327454},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.358599990606308},{"id":"https://openalex.org/C2777363581","wikidata":"https://www.wikidata.org/wiki/Q15098235","display_name":"Harm","level":2,"score":0.3449999988079071},{"id":"https://openalex.org/C2778348673","wikidata":"https://www.wikidata.org/wiki/Q739302","display_name":"Production (economics)","level":2,"score":0.313400000333786},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.3009999990463257},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.29440000653266907},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2833999991416931},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2648000121116638}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ase63991.2025.00038","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ase63991.2025.00038","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 40th IEEE/ACM International Conference on Automated Software Engineering (ASE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W1574491227","https://openalex.org/W2044458395","https://openalex.org/W2104107939","https://openalex.org/W2144951274","https://openalex.org/W2145373440","https://openalex.org/W2373227884","https://openalex.org/W2701082322","https://openalex.org/W2788267443","https://openalex.org/W2949167262","https://openalex.org/W2998011150","https://openalex.org/W3004796001","https://openalex.org/W4206969712","https://openalex.org/W4284689801","https://openalex.org/W4311887664","https://openalex.org/W4362514913","https://openalex.org/W4384345745","https://openalex.org/W4387142599","https://openalex.org/W4396214504","https://openalex.org/W4400582518","https://openalex.org/W4402443961","https://openalex.org/W4402457546","https://openalex.org/W4411551762","https://openalex.org/W4411552046","https://openalex.org/W4411552133","https://openalex.org/W4411552726","https://openalex.org/W4411552767","https://openalex.org/W4412888527"],"related_works":[],"abstract_inverted_index":{"The":[0],"growing":[1],"use":[2],"of":[3,12,21,47,51,83,125,133,201],"large":[4],"language":[5,14],"models":[6],"(LLMs)":[7],"has":[8],"increased":[9],"the":[10,48,88,122,126,131,147,206,218],"importance":[11],"natural":[13],"(NL)":[15],"in":[16,165],"software":[17,25],"engineering.":[18],"However,":[19],"ambiguity":[20,41,100],"NL":[22,53,66],"can":[23],"harm":[24],"quality,":[26],"as":[27],"unclear":[28],"problem":[29],"descriptions":[30,226],"may":[31],"lead":[32],"to":[33,98],"incorrect":[34],"program":[35,142],"generation.":[36],"Detecting":[37],"and":[38,63,120,141,144,170,180,190],"resolving":[39],"such":[40],"is":[42,72,90],"challenging,":[43],"motivating":[44],"our":[45],"introduction":[46],"automated":[49],"repair":[50,71],"ambiguous":[52],"descriptions,":[54,202],"which":[55],"we":[56,110,156],"approach":[57,164],"by":[58,130,209,235],"reducing":[59],"code":[60,185],"generation":[61,186],"uncertainty":[62],"better":[64],"aligning":[65],"with":[67],"input\u2013output":[68],"examples.":[69],"Ambiguity":[70],"difficult":[73],"for":[74,228],"LLMs":[75,97,176],"because":[76],"they":[77],"must":[78],"understand":[79],"how":[80],"their":[81],"interpretation":[82,124],"a":[84,154,166,213],"description":[85,127,148],"changes":[86,152],"when":[87],"text":[89],"altered.":[91],"We":[92,161],"find":[93],"that":[94],"directly":[95],"prompting":[96],"clarify":[99],"often":[101],"produces":[102],"irrelevant":[103],"or":[104,195],"inconsistent":[105],"edits.":[106],"To":[107],"address":[108],"this,":[109],"decompose":[111],"this":[112,163],"task":[113],"into":[114],"two":[115],"simpler":[116],"steps:":[117],"(1)":[118],"analyzing":[119],"repairing":[121],"LLM\u2019s":[123],"\u2014":[128,137],"captured":[129],"distribution":[132,151],"programs":[134],"it":[135,172],"induces":[136],"using":[138,173],"traditional":[139],"testing":[140],"repair,":[143],"(2)":[145],"refining":[146],"based":[149],"on":[150,182,205],"via":[153],"method":[155],"call":[157],"contrastive":[158],"specification":[159],"inference.":[160],"implement":[162],"tool":[167],"called":[168],"SPEC-FIX":[169],"evaluate":[171],"four":[174],"state-of-the-art":[175],"(GPT-4o,":[177],"GPT-4o-mini,":[178],"DeepSeek-V3,":[179],"Qwen2.5-Coder-32B-Instruct)":[181],"three":[183],"popular":[184],"benchmarks":[187],"(HumanEval+,":[188],"MBPP+":[189],"LiveCodeBench).":[191],"Without":[192],"human":[193],"intervention":[194],"external":[196],"information,":[197],"SPECFIX":[198],"modified":[199,207],"43.58%":[200],"improving":[203],"Pass@1":[204],"set":[208],"30.9%.":[210],"This":[211],"yields":[212],"4.09%":[214],"absolute":[215],"improvement":[216],"across":[217,224],"entire":[219],"benchmark.":[220],"Repairs":[221],"also":[222],"transfer":[223],"models:":[225],"repaired":[227],"one":[229],"model":[230],"improve":[231],"other":[232],"models\u2019":[233],"performance":[234],"10.48%.":[236]},"counts_by_year":[],"updated_date":"2026-01-29T23:17:01.242718","created_date":"2026-01-29T00:00:00"}
