{"id":"https://openalex.org/W4412944872","doi":"https://doi.org/10.18653/v1/2025.acl-long.957","title":"LLMs can be easily Confused by Instructional Distractions","display_name":"LLMs can be easily Confused by Instructional Distractions","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4412944872","doi":"https://doi.org/10.18653/v1/2025.acl-long.957"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2025.acl-long.957","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-long.957","pdf_url":"https://aclanthology.org/2025.acl-long.957.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.acl-long.957.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5119204390","display_name":"Yerin Hwang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yerin Hwang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103104054","display_name":"Yongil Kim","orcid":"https://orcid.org/0000-0003-0458-5280"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yongil Kim","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114619388","display_name":"Jahyun Koo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jahyun Koo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082023846","display_name":"Taegwan Kang","orcid":"https://orcid.org/0000-0002-9171-357X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Taegwan Kang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102579943","display_name":"Hyunkyung Bae","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hyunkyung Bae","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5077832834","display_name":"Kyomin Jung","orcid":"https://orcid.org/0000-0003-2547-7051"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kyomin Jung","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5119204390"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.22909347,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"19483","last_page":"19496"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13643","display_name":"Artificial Intelligence in Law","score":0.04690000042319298,"subfield":{"id":"https://openalex.org/subfields/3320","display_name":"Political Science and International Relations"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13643","display_name":"Artificial Intelligence in Law","score":0.04690000042319298,"subfield":{"id":"https://openalex.org/subfields/3320","display_name":"Political Science and International Relations"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6232380270957947}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6232380270957947}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.acl-long.957","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-long.957","pdf_url":"https://aclanthology.org/2025.acl-long.957.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.acl-long.957","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-long.957","pdf_url":"https://aclanthology.org/2025.acl-long.957.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1451011034","display_name":null,"funder_award_id":"2021-II212068","funder_id":"https://openalex.org/F4320328359","funder_display_name":"Ministry of Science and ICT, South Korea"},{"id":"https://openalex.org/G3598079552","display_name":null,"funder_award_id":"RS-2021-II211343","funder_id":"https://openalex.org/F4320335489","funder_display_name":"Institute for Information and Communications Technology Promotion"},{"id":"https://openalex.org/G5439187163","display_name":null,"funder_award_id":"RS-2021-II21206","funder_id":"https://openalex.org/F4320335489","funder_display_name":"Institute for Information and Communications Technology Promotion"},{"id":"https://openalex.org/G7288789209","display_name":null,"funder_award_id":"RS-2021-II211343","funder_id":"https://openalex.org/F4320328359","funder_display_name":"Ministry of Science and ICT, South Korea"},{"id":"https://openalex.org/G7575369263","display_name":null,"funder_award_id":"RS-2021-II212068","funder_id":"https://openalex.org/F4320335489","funder_display_name":"Institute for Information and Communications Technology Promotion"},{"id":"https://openalex.org/G7699972493","display_name":null,"funder_award_id":"RS-2021-II212068","funder_id":"https://openalex.org/F4320328359","funder_display_name":"Ministry of Science and ICT, South Korea"},{"id":"https://openalex.org/G7798134731","display_name":null,"funder_award_id":"RS-2021-II211343","funder_id":"https://openalex.org/F4320321292","funder_display_name":"Seoul National University"}],"funders":[{"id":"https://openalex.org/F4320321292","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542"},{"id":"https://openalex.org/F4320328359","display_name":"Ministry of Science and ICT, South Korea","ror":"https://ror.org/01wpjm123"},{"id":"https://openalex.org/F4320335489","display_name":"Institute for Information and Communications Technology Promotion","ror":"https://ror.org/01g0hqq23"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4412944872.pdf","grobid_xml":"https://content.openalex.org/works/W4412944872.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Despite":[0],"the":[1,23,43,50,68,72,137,168,177],"fact":[2],"that":[3,135],"large":[4],"language":[5],"models":[6,24,172],"(LLMs)":[7],"show":[8],"exceptional":[9],"skill":[10],"in":[11,153,173],"instruction":[12,70,111],"following":[13,31],"tasks,":[14],"this":[15,76,81],"strength":[16],"can":[17],"turn":[18],"into":[19],"a":[20,35,85],"vulnerability":[21],"when":[22,49],"are":[25,141,158],"required":[26],"to":[27,46,65,75,92,143,148,182],"disregard":[28],"certain":[29],"instructions.Instruction":[30],"tasks":[32],"typically":[33],"involve":[34],"clear":[36],"task":[37,69],"description":[38],"and":[39,71,106,116,129,165],"input":[40,51,120],"text":[41],"containing":[42],"target":[44,178],"data":[45],"be":[47,183],"processed.However,":[48],"itself":[52],"resembles":[53],"an":[54],"instruction,":[55],"confusion":[56],"may":[57,180],"arise,":[58],"even":[59,136],"if":[60],"there":[61],"is":[62],"explicit":[63],"prompting":[64],"distinguish":[66],"between":[67],"input.We":[73],"refer":[74],"phenomenon":[77],"as":[78],"instructional":[79,97,104,144,175],"distraction.In":[80],"paper,":[82],"we":[83],"introduce":[84],"novel":[86],"benchmark,":[87],"named":[88],"DIM-Bench,":[89],"specifically":[90],"designed":[91],"assess":[93],"LLMs'":[94],"performance":[95],"under":[96],"distraction.The":[98],"benchmark":[99],"categorizes":[100],"real-world":[101],"instances":[102],"of":[103,170],"distraction":[105],"evaluates":[107],"LLMs":[108,140],"across":[109],"four":[110],"tasks:":[112,121],"rewriting,":[113],"proofreading,":[114],"translation,":[115],"style":[117],"transfer-alongside":[118],"five":[119],"reasoning,":[122,126],"code":[123],"generation,":[124],"mathematical":[125],"bias":[127],"detection,":[128],"question":[130],"answering.Our":[131],"experimental":[132],"results":[133],"reveal":[134],"most":[138],"advanced":[139],"susceptible":[142],"distraction,":[145],"often":[146],"failing":[147],"accurately":[149],"follow":[150],"user":[151],"intent":[152],"such":[154],"cases.*":[155],"These":[156],"languages":[157,179],"commonly":[159],"supported":[160],"by":[161],"Llama":[162],"3.1,":[163],"GPT-3.5,":[164],"GPT-4o.To":[166],"evaluate":[167],"robustness":[169],"other":[171],"handling":[174],"distractions,":[176],"need":[181],"adjusted":[184],"accordingly.":[185]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
