{"id":"https://openalex.org/W4412888767","doi":"https://doi.org/10.18653/v1/2025.findings-acl.81","title":"TACO-RL: Task Aware Prompt Compression Optimization with Reinforcement Learning","display_name":"TACO-RL: Task Aware Prompt Compression Optimization with Reinforcement Learning","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4412888767","doi":"https://doi.org/10.18653/v1/2025.findings-acl.81"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2025.findings-acl.81","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.findings-acl.81","pdf_url":"https://aclanthology.org/2025.findings-acl.81.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics: ACL 2025","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.findings-acl.81.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043547691","display_name":"Shivam Shandilya","orcid":null},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Shivam Shandilya","raw_affiliation_strings":["Microsoft"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111082345","display_name":"Menglin Xia","orcid":null},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Menglin Xia","raw_affiliation_strings":["Microsoft"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101775931","display_name":"Supriyo Ghosh","orcid":"https://orcid.org/0000-0001-7275-3296"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Supriyo Ghosh","raw_affiliation_strings":["Microsoft"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070156365","display_name":"Huiqiang Jiang","orcid":"https://orcid.org/0000-0002-1327-4882"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Huiqiang Jiang","raw_affiliation_strings":["Microsoft"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100752550","display_name":"Jue Zhang","orcid":"https://orcid.org/0000-0003-0440-1357"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jue Zhang","raw_affiliation_strings":["Microsoft"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076476133","display_name":"Qianhui Wu","orcid":"https://orcid.org/0000-0001-9567-4128"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Qianhui Wu","raw_affiliation_strings":["Microsoft"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049145726","display_name":"Victor R\u00fchle","orcid":"https://orcid.org/0000-0002-8957-7628"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Victor R\u00fchle","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5070722259","display_name":"Saravan Rajmohan","orcid":"https://orcid.org/0000-0002-2019-213X"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Saravan Rajmohan","raw_affiliation_strings":["Microsoft"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7378,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.83640061,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1582","last_page":"1597"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9883000254631042,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9871000051498413,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8415716290473938},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7374411225318909},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6637200117111206},{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.5415293574333191},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.43285641074180603},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.38650697469711304},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.14556920528411865},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.07032984495162964}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8415716290473938},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7374411225318909},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6637200117111206},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.5415293574333191},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.43285641074180603},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38650697469711304},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.14556920528411865},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.07032984495162964},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.findings-acl.81","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.findings-acl.81","pdf_url":"https://aclanthology.org/2025.findings-acl.81.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics: ACL 2025","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.findings-acl.81","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.findings-acl.81","pdf_url":"https://aclanthology.org/2025.findings-acl.81.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics: ACL 2025","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4412888767.pdf","grobid_xml":"https://content.openalex.org/works/W4412888767.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W2920061524","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588","https://openalex.org/W2086122291","https://openalex.org/W1987513656"],"abstract_inverted_index":{"The":[0],"increasing":[1],"prevalence":[2],"of":[3,22,124,262,275,329,340,355],"large":[4],"language":[5],"models":[6],"(LLMs)":[7],"such":[8,60],"as":[9,61,67],"GPT-4":[10],"in":[11,19,31,181,183,235,240,358,363],"various":[12],"applications":[13],"has":[14],"led":[15],"to":[16,29,36,75],"a":[17,68,84,260],"surge":[18],"the":[20,38,48,110,122,148,164,336,341,356],"size":[21],"prompts":[23],"required":[24],"for":[25],"optimal":[26],"performance,":[27],"leading":[28],"challenges":[30],"computational":[32],"efficiency.Prompt":[33],"compression":[34,53,94,145,160,166],"aims":[35],"reduce":[37],"inference":[39],"cost":[40],"by":[41,151],"minimizing":[42],"input":[43],"tokens":[44],"without":[45],"compromising":[46],"on":[47,57,127],"task":[49,149],"performance.However,":[50],"existing":[51,102],"prompt":[52,93],"techniques":[54,161],"either":[55],"rely":[56],"sub-optimal":[58],"metrics":[59],"information":[62],"entropy":[63],"or":[64,324,327,405],"model":[65,107],"it":[66],"task-agnostic":[69],"token":[70,105],"classification":[71,106],"problem":[72],"that":[73,142,257],"fails":[74],"capture":[76],"task-specific":[77,114],"information.To":[78],"address":[79],"these":[80,155],"issues,":[81],"we":[82,100],"propose":[83],"novel":[85],"and":[86,130,138,168,319,348],"efficient":[87],"reinforcement":[88],"learning":[89,111],"(RL)":[90],"based":[91],"task-aware":[92],"method.To":[95],"ensure":[96],"low":[97],"latency":[98,169],"requirements,":[99],"leverage":[101],"Transformer":[103],"encoder-based":[104],"while":[108,162],"guiding":[109],"process":[112],"with":[113],"reward":[115],"signals":[116],"using":[117],"lightweight":[118],"REINFORCE":[119],"algorithm.We":[120],"evaluate":[121],"performance":[123,150],"our":[125,143],"method":[126,146],"three":[128,156],"diverse":[129],"challenging":[131],"tasks":[132],"including":[133],"text":[134],"summarization,":[135],"question":[136],"answering":[137],"code":[139],"summarization.We":[140],"demonstrate":[141],"RL-guided":[144],"improves":[147],"8%":[152],"-189%":[153],"across":[154],"scenarios":[157],"over":[158],"state-of-the-art":[159],"satisfying":[163],"same":[165],"rate":[167],"requirements.Answer":[170],"\"4,404.5":[171,248],"people\"":[172,249],"Question":[173],"\"How":[174],"many":[175],"people":[176,200,268],"per":[177,201,269],"square":[178,202,270],"mile":[179,203,271],"lived":[180],"Fresno":[182,194,206,258,276],"2010?\"":[184],"QA":[185],"Task":[186,187,242],"Aware":[188],"Compressed":[189,366],"Text":[190],"2010":[191,252],"Census":[192,255,368],"reported":[193,256],"population":[195,261,264,343,357],"494,665.population":[196],"density":[197,265],"was":[198,266,277],"4,404.5":[199,267],"(1,700.6/km2).racial":[204],"makeup":[205,274],"245,306":[207,278,371],"(49.6%)White,":[208,279],"40,960":[209,280],"(8.3%)":[210,281],"African":[211,282],"American,":[212,283,287],"8,525":[213,284],"(1.7%)":[214,285],"Native":[215,286],"American":[216,374,376],"62,528.6%)Asian":[217],"849":[218,310],"(0":[219],"Pacific":[220,312,399],"Islander":[221,400],"111,984.6%24,513":[222],"Hispanic":[223,337,407],"232,055":[224,333],"(46.9%).42.7%":[225],"Mexican":[226,410],"0.4%":[227,229,306,346,349,395,411,413],"Salvadoran":[228,412],"Puerto":[230,350,414],"Rican.Non-Hispanic":[231,351],"Whites":[232,352],"were":[233,332,353],"30.0%":[234,354],"2010,":[236,359],"down":[237,360],"from":[238,316,322,361],"72.6%":[239,362],"1970":[241,418],"Specific":[243],"RL":[244],"Feedback":[245],"GPT":[246],"3.5":[247],"Original":[250],"ContextThe":[251],"United":[253],"States":[254],"had":[259],"494,665.The":[263],"(1,700.6/km).The":[272],"racial":[273],"62,528":[288,377],"(12.6%)Asian":[289],"(3.6%":[290,379],"Hmong,":[291],"1.7%":[292,381],"Indian,":[293],"1.2%":[294,296,383,385],"Filipino,":[295],"Laotian,":[297],"1.0%":[298,387],"Thai,":[299],"0.8%":[300,389],"Cambodian,":[301],"0.7%":[302,391],"Chinese,":[303],"0.5%":[304,393],"Japanese,":[305],"Vietnamese,":[307],"0.2%":[308,397],"Korean),":[309,398],"(0.2%)":[311],"Islander,":[313],"111,984":[314,401],"(22.6%)":[315],"other":[317,402],"races,":[318],"24,513":[320,403],"(5.0%)":[321],"two":[323,404],"more":[325,406],"races.Hispanic":[326],"Latino":[328],"any":[330],"race":[331],"persons":[334],"(46.9%).Among":[335],"population,":[338],"42.7%":[339,409],"total":[342],"are":[344],"Mexican,":[345],"Salvadoran,":[347],"1970.":[364],"LLMLingua":[365],"Text2010":[367],"Fresno,665":[369],"4":[370],"White":[372],"40,960.3%African":[373],"8,525.7%Native":[375],"Asian":[378],"Hmong":[380],"Indian":[382],"Filipino":[384],"Laotian":[386],"Thai":[388],"Cambodian":[390],"Chinese":[392],"Japanese":[394],"Vietnamese":[396],"Latino,055":[408],"Rican":[415],"Non-Hispanic":[416],"30.0%72.6%":[417]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
