{"id":"https://openalex.org/W4414763085","doi":"https://doi.org/10.48550/arxiv.2509.05282","title":"Elucidating the Design Space of Decay in Linear Attention","display_name":"Elucidating the Design Space of Decay in Linear Attention","publication_year":2025,"publication_date":"2025-09-05","ids":{"openalex":"https://openalex.org/W4414763085","doi":"https://doi.org/10.48550/arxiv.2509.05282"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2509.05282","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.05282","pdf_url":"https://arxiv.org/pdf/2509.05282","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2509.05282","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101829994","display_name":"Zhen Qin","orcid":"https://orcid.org/0000-0002-9991-7024"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Qin, Zhen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063135412","display_name":"Xuyang Shen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Xuyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5082015443","display_name":"Ying Zhong","orcid":"https://orcid.org/0000-0003-3169-7069"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhong, Yiran","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101829994"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10581","display_name":"Neural dynamics and brain function","score":0.8277999758720398,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10581","display_name":"Neural dynamics and brain function","score":0.8277999758720398,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalar","display_name":"Scalar (mathematics)","score":0.6560999751091003},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5234000086784363},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.4316999912261963},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.3882000148296356},{"id":"https://openalex.org/keywords/parameter-space","display_name":"Parameter space","score":0.3856000006198883},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.367000013589859},{"id":"https://openalex.org/keywords/scalar-potential","display_name":"Scalar potential","score":0.3463999927043915},{"id":"https://openalex.org/keywords/exponential-decay","display_name":"Exponential decay","score":0.3443000018596649}],"concepts":[{"id":"https://openalex.org/C57691317","wikidata":"https://www.wikidata.org/wiki/Q1289248","display_name":"Scalar (mathematics)","level":2,"score":0.6560999751091003},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5234000086784363},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.49000000953674316},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.435699999332428},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.4316999912261963},{"id":"https://openalex.org/C121864883","wikidata":"https://www.wikidata.org/wiki/Q677916","display_name":"Statistical physics","level":1,"score":0.4268999993801117},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.40869998931884766},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3882000148296356},{"id":"https://openalex.org/C73586568","wikidata":"https://www.wikidata.org/wiki/Q2600211","display_name":"Parameter space","level":2,"score":0.3856000006198883},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.367000013589859},{"id":"https://openalex.org/C31836371","wikidata":"https://www.wikidata.org/wiki/Q1856609","display_name":"Scalar potential","level":2,"score":0.3463999927043915},{"id":"https://openalex.org/C180188523","wikidata":"https://www.wikidata.org/wiki/Q574576","display_name":"Exponential decay","level":2,"score":0.3443000018596649},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.3370000123977661},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3165000081062317},{"id":"https://openalex.org/C163175372","wikidata":"https://www.wikidata.org/wiki/Q3339222","display_name":"Linear model","level":2,"score":0.3077999949455261},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.30300000309944153},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.29589998722076416},{"id":"https://openalex.org/C2778648169","wikidata":"https://www.wikidata.org/wiki/Q967768","display_name":"Compatibility (geochemistry)","level":2,"score":0.28130000829696655},{"id":"https://openalex.org/C75235859","wikidata":"https://www.wikidata.org/wiki/Q582659","display_name":"Exponential growth","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.26440000534057617},{"id":"https://openalex.org/C55166926","wikidata":"https://www.wikidata.org/wiki/Q2892946","display_name":"Oracle","level":2,"score":0.2556000053882599}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2509.05282","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.05282","pdf_url":"https://arxiv.org/pdf/2509.05282","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2509.05282","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2509.05282","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2509.05282","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.05282","pdf_url":"https://arxiv.org/pdf/2509.05282","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,110,176],"comprehensive":[4],"investigation":[5],"into":[6],"the":[7,19,34,43,89,92,190],"decay":[8,23,49,51,96,126,145,162,167],"mechanisms":[9,24],"inherent":[10],"in":[11,154,168],"linear":[12,193],"complexity":[13],"sequence":[14],"models.":[15],"We":[16],"systematically":[17],"delineate":[18],"design":[20,90],"space":[21],"of":[22,45,75,91,113,192],"across":[25],"four":[26],"pivotal":[27],"dimensions:":[28],"parameterization":[29,93,142,159],"strategy,":[30],"which":[31,41],"refers":[32],"to":[33,109,128,149,185,189],"computational":[35],"methodology":[36],"for":[37,48,95],"decay;":[38,57],"parameter":[39,116],"sharing,":[40],"involves":[42],"utilization":[44],"supplementary":[46],"parameters":[47],"computation;":[50],"granularity,":[52],"comparing":[53],"scalar":[54,144,161],"versus":[55],"vector-based":[56,151],"and":[58],"compatibility":[59],"with":[60,157],"relative":[61,179],"positional":[62,180],"encoding":[63,181],"methods,":[64],"such":[65],"as":[66,122],"Rotary":[67],"Position":[68],"Embedding":[69],"(RoPE).":[70],"Through":[71],"an":[72],"extensive":[73],"series":[74],"experiments":[76],"conducted":[77],"on":[78],"diverse":[79],"language":[80],"modeling":[81],"tasks,":[82],"we":[83],"uncovered":[84],"several":[85],"critical":[86],"insights.":[87],"Firstly,":[88],"strategy":[94],"requires":[97],"meticulous":[98],"consideration.":[99],"Our":[100],"findings":[101],"indicate":[102],"that":[103,174],"effective":[104],"configurations":[105],"are":[106],"typically":[107,183],"confined":[108],"specific":[111],"range":[112],"parameters.":[114],"Secondly,":[115],"sharing":[117],"cannot":[118],"be":[119,129],"used":[120],"arbitrarily,":[121],"it":[123],"may":[124,163],"cause":[125],"values":[127],"too":[130,133],"large":[131],"or":[132],"small,":[134],"thereby":[135],"significantly":[136],"impacting":[137],"performance.":[138],"Thirdly,":[139],"under":[140],"identical":[141],"strategies,":[143,160],"generally":[146],"underperforms":[147],"compared":[148],"its":[150],"counterpart.":[152],"However,":[153],"certain":[155],"scenarios":[156],"alternative":[158],"unexpectedly":[164],"surpass":[165],"vector":[166],"efficacy.":[169],"Lastly,":[170],"our":[171],"analysis":[172],"reveals":[173],"RoPE,":[175],"commonly":[177],"employed":[178],"method,":[182],"fails":[184],"provide":[186],"tangible":[187],"benefits":[188],"majority":[191],"attention":[194],"mechanisms.":[195]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
