{"id":"https://openalex.org/W4402670059","doi":"https://doi.org/10.18653/v1/2024.findings-acl.576","title":"Understanding and Patching Compositional Reasoning in LLMs","display_name":"Understanding and Patching Compositional Reasoning in LLMs","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4402670059","doi":"https://doi.org/10.18653/v1/2024.findings-acl.576"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2024.findings-acl.576","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2024.findings-acl.576","pdf_url":"https://aclanthology.org/2024.findings-acl.576.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics ACL 2024","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2024.findings-acl.576.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049050227","display_name":"Z. Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhaoyi Li","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107506903","display_name":"Gangwei Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gangwei Jiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034462876","display_name":"Hong Xie","orcid":"https://orcid.org/0000-0001-6610-0723"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hong Xie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101308839","display_name":"Linqi Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Linqi Song","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085254654","display_name":"Defu Lian","orcid":"https://orcid.org/0000-0002-3507-9607"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Defu Lian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5107904074","display_name":"Ying Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ying Wei","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5049050227"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.139,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.89254987,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"9668","last_page":"9688"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13643","display_name":"Artificial Intelligence in Law","score":0.8112999796867371,"subfield":{"id":"https://openalex.org/subfields/3320","display_name":"Political Science and International Relations"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13643","display_name":"Artificial Intelligence in Law","score":0.8112999796867371,"subfield":{"id":"https://openalex.org/subfields/3320","display_name":"Political Science and International Relations"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.7760999798774719,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10703","display_name":"Business Process Modeling and Analysis","score":0.7609999775886536,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5060178637504578}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5060178637504578}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.18653/v1/2024.findings-acl.576","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2024.findings-acl.576","pdf_url":"https://aclanthology.org/2024.findings-acl.576.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics ACL 2024","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.atira.dk:publications/8d56d92a-fbb6-4904-80af-1657b4d94e03","is_oa":true,"landing_page_url":"https://hdl.handle.net/2031/8d56d92a-fbb6-4904-80af-1657b4d94e03","pdf_url":null,"source":{"id":"https://openalex.org/S7407055387","display_name":"CityU Scholars","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Li, Z, Jiang, G, Xie, H, Song, L, Lian, D & Wei, Y 2024, Understanding and Patching Compositional Reasoning in LLMs. in L-W Ku, A Martins & V Srikumar (eds), 62nd Annual Meeting of the Association for Computational Linguistics (ACL 2024) - Proceedings of the Conference. Proceedings of the Annual Meeting of the Association for Computational Linguistics, Association for Computational Linguistics, Kerrville, TX, pp. 9668-9688, 62nd Annual Meeting of the Association for Computational Linguistics (ACL 2024), Bangkok, Thailand, 11/08/24. https://doi.org/10.18653/v1/2024.findings-acl.576","raw_type":"contributionToPeriodical"}],"best_oa_location":{"id":"doi:10.18653/v1/2024.findings-acl.576","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2024.findings-acl.576","pdf_url":"https://aclanthology.org/2024.findings-acl.576.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics ACL 2024","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3643945900","display_name":null,"funder_award_id":"62371411","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4386184646","display_name":null,"funder_award_id":"2371411","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8513333314","display_name":null,"funder_award_id":"2021ZD01","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322499","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4402670059.pdf","grobid_xml":"https://content.openalex.org/works/W4402670059.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"LLMs":[0],"have":[1],"marked":[2],"a":[3,18,81,122],"revolutonary":[4],"shift,":[5],"yet":[6],"they":[7],"falter":[8],"when":[9],"faced":[10],"with":[11],"compositional":[12,26,129,152],"reasoning":[13,27,44,72,89,113,130,153],"tasks.Our":[14],"research":[15],"embarks":[16],"on":[17,115],"quest":[19],"to":[20,52,59,125,141],"uncover":[21],"the":[22,38,61,86,104,116,133,145],"root":[23],"causes":[24],"of":[25,29,34,65,111],"failures":[28],"LLMs,":[30],"uncovering":[31],"that":[32,70],"most":[33],"them":[35],"stem":[36],"from":[37],"improperly":[39],"generated":[40],"or":[41],"leveraged":[42],"implicit":[43,71,112],"results.Inspired":[45],"by":[46],"our":[47],"empirical":[48,137],"findings,":[49,118],"we":[50,119],"resort":[51],"Logit":[53],"Lens":[54],"and":[55,79,109,149],"an":[56],"intervention":[57],"experiment":[58],"dissect":[60],"inner":[62],"hidden":[63],"states":[64],"LLMs.This":[66],"deep":[67],"dive":[68],"reveals":[69],"results":[73],"indeed":[74],"surface":[75],"within":[76,98],"middle":[77],"layers":[78],"play":[80],"causative":[82],"role":[83],"in":[84,106,128,155],"shaping":[85],"final":[87],"explicit":[88],"results.Our":[90],"exploration":[91],"further":[92],"locates":[93],"multi-head":[94],"self-attention":[95],"(MHSA)":[96],"modules":[97],"these":[99],"layers,":[100],"which":[101],"emerge":[102],"as":[103],"linchpins":[105],"accurate":[107],"generation":[108],"leveraing":[110],"results.Grounded":[114],"above":[117],"develop":[120],"CREME,":[121],"lightweight":[123],"method":[124],"patch":[126],"errors":[127],"via":[131],"editing":[132],"located":[134],"MHSA":[135],"modules.Our":[136],"evidence":[138],"stands":[139],"testament":[140],"CREME's":[142],"effectiveness,":[143],"paving":[144],"way":[146],"for":[147],"autonomously":[148],"continuously":[150],"enhancing":[151],"capabilities":[154],"language":[156],"models.":[157]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
