{"id":"https://openalex.org/W7125928527","doi":"https://doi.org/10.1109/ase63991.2025.00088","title":"Automated Inline Comment Smell Detection and Repair with Large Language Models","display_name":"Automated Inline Comment Smell Detection and Repair with Large Language Models","publication_year":2025,"publication_date":"2025-11-16","ids":{"openalex":"https://openalex.org/W7125928527","doi":"https://doi.org/10.1109/ase63991.2025.00088"},"language":null,"primary_location":{"id":"doi:10.1109/ase63991.2025.00088","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ase63991.2025.00088","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 40th IEEE/ACM International Conference on Automated Software Engineering (ASE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5118792447","display_name":"Hatice K\u00fcbra \u00c7a\u011flar","orcid":null},"institutions":[{"id":"https://openalex.org/I168864056","display_name":"Bilkent University","ror":"https://ror.org/02vh8a032","country_code":"TR","type":"education","lineage":["https://openalex.org/I168864056"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Hatice K\u00fcbra \u00c7a\u011flar","raw_affiliation_strings":["Bilkent University Udemy, Inc.,Computer Science,Ankara,Turkey"],"affiliations":[{"raw_affiliation_string":"Bilkent University Udemy, Inc.,Computer Science,Ankara,Turkey","institution_ids":["https://openalex.org/I168864056"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111926375","display_name":"Semih \u00c7a\u011flar","orcid":null},"institutions":[{"id":"https://openalex.org/I168864056","display_name":"Bilkent University","ror":"https://ror.org/02vh8a032","country_code":"TR","type":"education","lineage":["https://openalex.org/I168864056"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Semih \u00c7a\u011flar","raw_affiliation_strings":["Bilkent University,Computer Science,Ankara,Turkey"],"affiliations":[{"raw_affiliation_string":"Bilkent University,Computer Science,Ankara,Turkey","institution_ids":["https://openalex.org/I168864056"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5093220032","display_name":"Eray T\u00fcz\u00fcn","orcid":null},"institutions":[{"id":"https://openalex.org/I168864056","display_name":"Bilkent University","ror":"https://ror.org/02vh8a032","country_code":"TR","type":"education","lineage":["https://openalex.org/I168864056"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Eray T\u00fcz\u00fcn","raw_affiliation_strings":["Bilkent University,Computer Science,Ankara,Turkey"],"affiliations":[{"raw_affiliation_string":"Bilkent University,Computer Science,Ankara,Turkey","institution_ids":["https://openalex.org/I168864056"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5118792447"],"corresponding_institution_ids":["https://openalex.org/I168864056"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.85240326,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1008","last_page":"1019"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9570000171661377,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9570000171661377,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.006899999920278788,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.0052999998442828655,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code-smell","display_name":"Code smell","score":0.8438000082969666},{"id":"https://openalex.org/keywords/macro","display_name":"Macro","score":0.6628999710083008},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5914000272750854},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.5802000164985657},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4966999888420105},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.47029998898506165},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.41190001368522644}],"concepts":[{"id":"https://openalex.org/C133237599","wikidata":"https://www.wikidata.org/wiki/Q2295111","display_name":"Code smell","level":5,"score":0.8438000082969666},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7300999760627747},{"id":"https://openalex.org/C166955791","wikidata":"https://www.wikidata.org/wiki/Q629579","display_name":"Macro","level":2,"score":0.6628999710083008},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5914000272750854},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.5802000164985657},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4966999888420105},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.47029998898506165},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.459199994802475},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41920000314712524},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.41190001368522644},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.35589998960494995},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3538999855518341},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3402999937534332},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.302700012922287},{"id":"https://openalex.org/C117447612","wikidata":"https://www.wikidata.org/wiki/Q1412670","display_name":"Software quality","level":4,"score":0.30239999294281006},{"id":"https://openalex.org/C148524875","wikidata":"https://www.wikidata.org/wiki/Q6975395","display_name":"F1 score","level":2,"score":0.2833999991416931},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.27379998564720154},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.257999986410141},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.25699999928474426},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2547000050544739}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ase63991.2025.00088","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ase63991.2025.00088","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 40th IEEE/ACM International Conference on Automated Software Engineering (ASE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2005422315","https://openalex.org/W2053154970","https://openalex.org/W2118655104","https://openalex.org/W2152874840","https://openalex.org/W2293265747","https://openalex.org/W2954876572","https://openalex.org/W2963672599","https://openalex.org/W2999309192","https://openalex.org/W3015080226","https://openalex.org/W3086831424","https://openalex.org/W3122527318","https://openalex.org/W3174589346","https://openalex.org/W3197666682","https://openalex.org/W3215377758","https://openalex.org/W4206738852","https://openalex.org/W4281384435","https://openalex.org/W4284889817","https://openalex.org/W4320490961","https://openalex.org/W4384302749","https://openalex.org/W4388593316","https://openalex.org/W4390638022","https://openalex.org/W4393870628","https://openalex.org/W4399667815","https://openalex.org/W4411552084"],"related_works":[],"abstract_inverted_index":{"Context:":[0],"Code":[1],"comments":[2,16],"play":[3],"a":[4,72,105,115,259,363],"critical":[5],"role":[6],"in":[7,32,68,95,127,149,250],"improving":[8],"code":[9,27,101,109],"readability,":[10],"maintainability,":[11],"and":[12,98,135,140,152,170,182,238,268,272,323,347,368,376],"collaborative":[13],"development.":[14],"However,":[15],"may":[17],"deviate":[18],"from":[19,337],"best":[20,209,256],"practices":[21],"due":[22],"to":[23,50,206],"software":[24,56],"evolution,":[25],"where":[26,194],"changes":[28],"are":[29,66,217,283],"not":[30],"reflected":[31],"comments,":[33,125],"as":[34,36,40,291,345],"well":[35],"practitioner-related":[37],"issues":[38,48],"such":[39,290,344],"vague":[41],"descriptions,":[42],"redundancy,":[43],"or":[44,77],"misaligned":[45],"intent.":[46],"These":[47],"lead":[49],"various":[51],"comment":[52,63,102,110,365],"smells":[53,76],"that":[54],"degrade":[55],"quality.":[57],"While":[58],"prior":[59,116],"studies":[60],"have":[61],"explored":[62],"inconsistencies,":[64],"most":[65],"limited":[67],"scope,":[69],"either":[70],"addressing":[71],"narrow":[73],"subset":[74],"of":[75,90,108,123,233,236,240,245,263,318,321,325,350,359],"focusing":[78],"solely":[79],"on":[80,372],"detection":[81,188,196,229,296,314],"without":[82],"considering":[83],"repair.Objective:":[84],"This":[85],"study":[86],"evaluates":[87],"the":[88,191,195,199,208,226,243,251,255,311,328,348,357],"effectiveness":[89],"large":[91],"language":[92],"models":[93],"(LLMs)":[94],"both":[96],"detecting":[97],"repairing":[99],"inline":[100],"smells,":[103],"using":[104,165,178],"comprehensive":[106],"taxonomy":[107],"smell":[111],"types.Method:":[112],"We":[113],"extended":[114],"data":[117],"set":[118],"by":[119,266,300],"incorporating":[120],"repaired":[121],"versions":[122],"smelly":[124],"resulting":[126],"2,211":[128],"unique":[129],"instances.":[130],"Four":[131],"LLMs\u2014GPT-4o-mini,":[132],"o3-mini,":[133],"DeepSeek-V3,":[134],"Codestral-2501\u2014are":[136],"evaluated":[137,177],"under":[138],"zero-shot":[139,252,281,338],"few-shot":[141,223,302,308],"prompting":[142,224,309],"strategies.":[143],"To":[144],"account":[145],"for":[146,219,286],"non-deterministic":[147],"behavior":[148],"LLM":[150],"outputs":[151,189],"ensure":[153],"robustness,":[154],"each":[155],"configuration":[156],"is":[157,163,176,204],"executed":[158],"five":[159],"times.":[160],"Detection":[161],"performance":[162,297],"measured":[164],"accuracy,":[166],"macro":[167,201,231,316],"F1":[168,202,232,317],"score,":[169],"Matthews":[171],"correlation":[172],"coefficient":[173],"(MCC);":[174],"repair":[175,192,211,333,366],"SBERT":[179,261],"similarity,":[180],"METEOR,":[181],"ROUGE-L.":[183],"Our":[184,354],"multi-stage":[185],"pipeline":[186],"feeds":[187],"into":[190],"phase,":[193],"result":[197],"with":[198,222,258,307],"highest":[200,227,312],"score":[203,262],"used":[205],"simulate":[207],"possible":[210],"scenario.":[212],"Median":[213],"scores":[214],"across":[215],"runs":[216],"reported":[218],"comparison.Results:":[220],"o3-mini":[221,273,292,306],"achieves":[225],"median":[228,260,313],"performance:":[230],"0.41,":[234,319],"MCC":[235,320],"0.50,":[237,322],"accuracy":[239,324],"0.72,":[241,326],"exceeding":[242],"baseline":[244],"GPT-4.":[246],"For":[247,304],"repair,":[248],"Codestral-2501":[249],"setting":[253],"yields":[254],"results":[257],"0.61,":[264],"followed":[265],"DeepSeek-V3":[267],"GPT-4o-mini":[269],"at":[270,274],"0.53,":[271],"0.46.":[275],"Few-shot":[276],"prompts":[277,282],"improve":[278],"detection,":[279],"while":[280],"more":[284,336],"effective":[285,301],"repair.Conclusion:":[287],"Lightweight":[288],"LLMs":[289],"can":[293],"achieve":[294],"strong":[295],"when":[298],"guided":[299],"prompts.":[303],"example,":[305],"attains":[310],"results:":[315],"surpassing":[327],"GPT-4":[329],"baseline.":[330],"In":[331],"contrast,":[332],"tasks":[334],"benefit":[335],"prompting,":[339],"though":[340],"they":[341],"introduce":[342],"challenges":[343],"overfitting":[346],"risk":[349],"generating":[351],"new":[352],"smells.":[353],"findings":[355],"support":[356],"development":[358],"practical":[360],"tools,":[361],"including":[362],"GitHub-integrated":[364],"assistant,":[367],"motivate":[369],"future":[370],"work":[371],"dynamic":[373],"prompt":[374],"selection":[375],"multilingual":[377],"benchmark":[378],"construction.":[379]},"counts_by_year":[],"updated_date":"2026-01-29T23:17:01.242718","created_date":"2026-01-29T00:00:00"}
