{"id":"https://openalex.org/W7152650242","doi":"https://doi.org/10.1145/3774904.3792911","title":"PAOSC: Plug-and-play Attention Optimization for Semantic Consistency in LLMs","display_name":"PAOSC: Plug-and-play Attention Optimization for Semantic Consistency in LLMs","publication_year":2026,"publication_date":"2026-04-09","ids":{"openalex":"https://openalex.org/W7152650242","doi":"https://doi.org/10.1145/3774904.3792911"},"language":null,"primary_location":{"id":"doi:10.1145/3774904.3792911","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3774904.3792911","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2026","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3774904.3792911","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133305172","display_name":"Chang Li","orcid":"https://orcid.org/0009-0009-7695-7814"},"institutions":[{"id":"https://openalex.org/I4210108629","display_name":"Computer Network Information Center","ror":"https://ror.org/01s0wyf50","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210108629"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chang Li","raw_affiliation_strings":["Computer Network Information Center, Chinese Academy of Sciences, BEIJING, China"],"raw_orcid":"https://orcid.org/0009-0009-7695-7814","affiliations":[{"raw_affiliation_string":"Computer Network Information Center, Chinese Academy of Sciences, BEIJING, China","institution_ids":["https://openalex.org/I4210108629"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124203791","display_name":"Yawei Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210108629","display_name":"Computer Network Information Center","ror":"https://ror.org/01s0wyf50","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210108629"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yawei Liu","raw_affiliation_strings":["Computer Network Information Center, Chinese Academy of Sciences, BEIJING, China"],"raw_orcid":"https://orcid.org/0009-0009-3673-1597","affiliations":[{"raw_affiliation_string":"Computer Network Information Center, Chinese Academy of Sciences, BEIJING, China","institution_ids":["https://openalex.org/I4210108629"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133241058","display_name":"Chun Long","orcid":"https://orcid.org/0000-0003-0351-6486"},"institutions":[{"id":"https://openalex.org/I4210108629","display_name":"Computer Network Information Center","ror":"https://ror.org/01s0wyf50","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210108629"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chun Long","raw_affiliation_strings":["Computer Network Information Center, Chinese Academy of Sciences, BEIJING, China"],"raw_orcid":"https://orcid.org/0000-0003-0351-6486","affiliations":[{"raw_affiliation_string":"Computer Network Information Center, Chinese Academy of Sciences, BEIJING, China","institution_ids":["https://openalex.org/I4210108629"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133310982","display_name":"Jing Zhao","orcid":"https://orcid.org/0009-0001-5933-1301"},"institutions":[{"id":"https://openalex.org/I4210108629","display_name":"Computer Network Information Center","ror":"https://ror.org/01s0wyf50","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210108629"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Zhao","raw_affiliation_strings":["Computer Network Information Center, Chinese Academy of Sciences, BEIJING, China"],"raw_orcid":"https://orcid.org/0009-0001-5933-1301","affiliations":[{"raw_affiliation_string":"Computer Network Information Center, Chinese Academy of Sciences, BEIJING, China","institution_ids":["https://openalex.org/I4210108629"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063658622","display_name":"Guanyao Du","orcid":null},"institutions":[{"id":"https://openalex.org/I4210108629","display_name":"Computer Network Information Center","ror":"https://ror.org/01s0wyf50","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210108629"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guanyao Du","raw_affiliation_strings":["Computer Network Information Center, Chinese Academy of Sciences, BEIJING, China"],"raw_orcid":"https://orcid.org/0009-0002-7988-8892","affiliations":[{"raw_affiliation_string":"Computer Network Information Center, Chinese Academy of Sciences, BEIJING, China","institution_ids":["https://openalex.org/I4210108629"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5133305172"],"corresponding_institution_ids":["https://openalex.org/I4210108629"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.82210297,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"8565","last_page":"8568"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.3560999929904938,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.3560999929904938,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.2011999934911728,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.16529999673366547,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5378999710083008},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.26339998841285706},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.2558000087738037},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.2533000111579895}],"concepts":[{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5378999710083008},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5178999900817871},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4510999917984009},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3061999976634979},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.26339998841285706},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.25679999589920044},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.2558000087738037},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.25360000133514404},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2533000111579895},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.23810000717639923}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3774904.3792911","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3774904.3792911","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2026","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3774904.3792911","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3774904.3792911","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2026","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":2,"referenced_works":["https://openalex.org/W4221089501","https://openalex.org/W4388212317"],"related_works":[],"abstract_inverted_index":{"Attention":[0],"mechanisms":[1],"are":[2],"essential":[3],"to":[4,25,58,80,92,99,119],"the":[5,45,51,55,101,124,128],"success":[6],"of":[7,54,61,135],"Large":[8],"Language":[9],"Models":[10],"(LLMs).":[11],"In":[12],"practice,":[13],"models":[14],"often":[15,43],"overemphasize":[16],"semantically":[17],"low-value":[18,136],"tokens,":[19,137],"forming":[20],"attention":[21,40,48,76],"sinks":[22],"while":[23,141],"failing":[24],"capture":[26],"truly":[27],"informative":[28,94],"tokens.":[29],"Existing":[30],"inference-time":[31],"optimization":[32,77],"methods":[33],"mainly":[34],"rely":[35],"on":[36,107,114],"static":[37],"adjustments":[38],"or":[39],"redistribution,":[41],"which":[42],"disrupt":[44],"correspondence":[46],"between":[47],"distribution":[49],"and":[50,64,96,110],"actual":[52],"semantics":[53],"input,":[56],"leading":[57],"a":[59,74,90,97,120],"loss":[60,111],"semantic":[62,82,143],"consistency":[63,83],"degraded":[65],"performance.":[66],"To":[67],"address":[68],"this":[69],"problem,":[70],"we":[71],"propose":[72],"PAOSC,":[73],"plug-and-play":[75],"model":[78],"designed":[79],"maintain":[81],"by":[84],"dynamically":[85],"adjusting":[86],"attention.":[87],"PAOSC":[88,132],"employs":[89],"generator":[91,102],"identify":[93],"tokens":[95],"discriminator":[98],"optimize":[100],"via":[103],"policy":[104],"gradients":[105],"based":[106],"confidence":[108],"changes":[109],"fluctuations.":[112],"Experiments":[113],"eight":[115],"LLMs":[116],"show":[117],"up":[118],"9.68%":[121],"improvement":[122],"in":[123],"F1":[125],"score.":[126],"On":[127],"constructed":[129],"HTTP-RL":[130],"dataset,":[131],"eliminates":[133],"18%":[134],"improving":[138],"inference":[139],"efficiency":[140],"maintaining":[142],"consistency.":[144],"Our":[145],"code":[146],"is":[147],"available":[148],"at":[149],"https://github.com/ChangLi000/PAOSC.":[150]},"counts_by_year":[],"updated_date":"2026-04-11T06:13:24.991567","created_date":"2026-04-10T00:00:00"}
