{"id":"https://openalex.org/W4403536473","doi":"https://doi.org/10.1145/3691620.3695072","title":"How Effectively Do Code Language Models Understand Poor-Readability Code?","display_name":"How Effectively Do Code Language Models Understand Poor-Readability Code?","publication_year":2024,"publication_date":"2024-10-18","ids":{"openalex":"https://openalex.org/W4403536473","doi":"https://doi.org/10.1145/3691620.3695072"},"language":"en","primary_location":{"id":"doi:10.1145/3691620.3695072","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3691620.3695072","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 39th IEEE/ACM International Conference on Automated Software Engineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103386678","display_name":"Can Hu","orcid":"https://orcid.org/0009-0007-0713-4393"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chao Hu","raw_affiliation_strings":["School of Software, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Software, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012766337","display_name":"Yitian Chai","orcid":"https://orcid.org/0000-0002-2491-366X"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yitian Chai","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111208115","display_name":"Haochen Zhou","orcid":"https://orcid.org/0000-0002-3587-5013"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao Zhou","raw_affiliation_strings":["WeChat AI, Tencent, Beijing, China"],"affiliations":[{"raw_affiliation_string":"WeChat AI, Tencent, Beijing, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024849044","display_name":"Fandong Meng","orcid":"https://orcid.org/0000-0002-8158-2377"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fandong Meng","raw_affiliation_strings":["WeChat AI, Tencent, Beijing, China"],"affiliations":[{"raw_affiliation_string":"WeChat AI, Tencent, Beijing, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100770464","display_name":"Jie Zhou","orcid":"https://orcid.org/0000-0002-5899-5165"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Zhou","raw_affiliation_strings":["Tencent Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tencent Inc., Beijing, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033286111","display_name":"Xiaodong Gu","orcid":"https://orcid.org/0000-0002-0529-6408"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaodong Gu","raw_affiliation_strings":["School of Software, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Software, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5103386678"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":1.0425,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.81403485,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"795","last_page":"806"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.989799976348877,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9718999862670898,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8113603591918945},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.6772609949111938},{"id":"https://openalex.org/keywords/readability","display_name":"Readability","score":0.5985431671142578},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5042241811752319}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8113603591918945},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.6772609949111938},{"id":"https://openalex.org/C2778143727","wikidata":"https://www.wikidata.org/wiki/Q1820650","display_name":"Readability","level":2,"score":0.5985431671142578},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5042241811752319},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3691620.3695072","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3691620.3695072","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 39th IEEE/ACM International Conference on Automated Software Engineering","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/1","score":0.6200000047683716,"display_name":"No poverty"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W2014232144","https://openalex.org/W2142112143","https://openalex.org/W2159739762","https://openalex.org/W2463537704","https://openalex.org/W2516621648","https://openalex.org/W2749460454","https://openalex.org/W2884276923","https://openalex.org/W2889391561","https://openalex.org/W2892187814","https://openalex.org/W2991900764","https://openalex.org/W3004658838","https://openalex.org/W3093415205","https://openalex.org/W3098605233","https://openalex.org/W3106692695","https://openalex.org/W3109966548","https://openalex.org/W3155146092","https://openalex.org/W3188431509","https://openalex.org/W3190338376","https://openalex.org/W3198685994","https://openalex.org/W3214739505","https://openalex.org/W4205371973","https://openalex.org/W4210499321","https://openalex.org/W4283751459","https://openalex.org/W4284667247","https://openalex.org/W4308641647","https://openalex.org/W4308731473","https://openalex.org/W4382317573","https://openalex.org/W4385571808","https://openalex.org/W4394746523"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W1964661231","https://openalex.org/W4254960163","https://openalex.org/W3110264473","https://openalex.org/W2999103397","https://openalex.org/W2370831213","https://openalex.org/W4315704968","https://openalex.org/W4285478380"],"abstract_inverted_index":{"Code":[0],"language":[1],"models":[2,41,87,108,212],"such":[3,202],"as":[4,203],"CodeT5":[5],"and":[6,27,177,185,219,226],"CodeLlama":[7],"have":[8,21],"demonstrated":[9],"substantial":[10],"achievement":[11],"in":[12,54],"code":[13,39,53,85,89,106,112,163,189,223],"comprehension.":[14],"While":[15],"the":[16,33,49,63,67,71,82,126,130,143,153,171,209],"majority":[17],"of":[18,48,51,66,84,188,211],"research":[19],"efforts":[20],"focused":[22],"on":[23,122,152,162,213],"improving":[24],"model":[25],"architectures":[26],"training":[28],"processes,":[29],"we":[30,80,155],"find":[31],"that":[32,104],"current":[34,105],"benchmarks":[35,134,206],"used":[36],"for":[37,199,222],"evaluating":[38,138],"comprehension":[40],"are":[42,59,109,135],"confined":[43],"to":[44,61,73,88,111,146,207],"high-readability":[45],"code,":[46,127,215],"regardless":[47],"popularity":[50],"low-readability":[52],"reality.":[55],"As":[56],"such,":[57],"they":[58],"inadequate":[60],"demonstrate":[62],"full":[64],"spectrum":[65],"model's":[68],"ability,":[69],"particularly":[70],"robustness":[72,83,210],"varying":[74,91],"readability":[75,169],"degrees.":[76],"In":[77,116],"this":[78],"paper,":[79],"analyze":[81],"summarization":[86,107,164,190],"with":[90,113],"readability,":[92],"including":[93],"seven":[94],"obfuscated":[95],"datasets":[96],"derived":[97],"from":[98],"existing":[99],"benchmarks.":[100],"Our":[101,192],"findings":[102],"indicate":[103],"vulnerable":[110],"poor":[114],"readability.":[115],"particular,":[117],"their":[118,178],"performance":[119],"predominantly":[120],"depends":[121],"semantic":[123,139],"cues":[124],"within":[125],"often":[128],"neglecting":[129],"syntactic":[131,149],"aspects.":[132],"Existing":[133],"biased":[136],"toward":[137],"features,":[140],"thereby":[141,180],"overlooking":[142],"models'":[144],"ability":[145],"understand":[147],"nonsensitive":[148],"features.":[150],"Based":[151],"findings,":[154],"present":[156],"Poor-CodeSumEval,":[157],"a":[158,182],"new":[159],"evaluation":[160,187],"benchmark":[161],"tasks.":[165],"PoorCodeSumEval":[166],"innovatively":[167],"introduces":[168],"into":[170],"testing":[172],"process,":[173],"considering":[174],"semantic,":[175],"syntactic,":[176],"cross-obfuscation,":[179],"providing":[181],"more":[183,196],"comprehensive":[184],"rigorous":[186],"models.":[191],"studies":[193],"also":[194],"provide":[195],"insightful":[197],"suggestions":[198],"future":[200],"research,":[201],"constructing":[204],"multi-readability":[205],"evaluate":[208],"poor-readability":[214],"proposing":[216],"readability-awareness":[217],"metrics,":[218],"automatic":[220],"methods":[221],"data":[224],"cleaning":[225],"normalization.":[227]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
