{"id":"https://openalex.org/W7162414363","doi":"https://doi.org/10.48550/arxiv.2605.26035","title":"Length Generalization with Log-Depth Recurrent Units","display_name":"Length Generalization with Log-Depth Recurrent Units","publication_year":2026,"publication_date":"2026-05-25","ids":{"openalex":"https://openalex.org/W7162414363","doi":"https://doi.org/10.48550/arxiv.2605.26035"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.26035","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26035","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.26035","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5099173706","display_name":"Charles Pert","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pert, Charles","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029277829","display_name":"Dalal Alrajeh","orcid":"https://orcid.org/0000-0002-1365-8026"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alrajeh, Dalal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137042689","display_name":"Alessandra Russo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Russo, Alessandra","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.24690000712871552,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.24690000712871552,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.22210000455379486,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.05119999870657921,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.5939000248908997},{"id":"https://openalex.org/keywords/prefix","display_name":"Prefix","score":0.5938000082969666},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.49140000343322754},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4242999851703644},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.41819998621940613},{"id":"https://openalex.org/keywords/testbed","display_name":"Testbed","score":0.37599998712539673},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3569999933242798},{"id":"https://openalex.org/keywords/type","display_name":"Type (biology)","score":0.3156999945640564}],"concepts":[{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5939000248908997},{"id":"https://openalex.org/C141603448","wikidata":"https://www.wikidata.org/wiki/Q134830","display_name":"Prefix","level":2,"score":0.5938000082969666},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5845000147819519},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5249999761581421},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49230000376701355},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.49140000343322754},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4242999851703644},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.41819998621940613},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3871999979019165},{"id":"https://openalex.org/C31395832","wikidata":"https://www.wikidata.org/wiki/Q1318674","display_name":"Testbed","level":2,"score":0.37599998712539673},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3598000109195709},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3569999933242798},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.32339999079704285},{"id":"https://openalex.org/C2777299769","wikidata":"https://www.wikidata.org/wiki/Q3707858","display_name":"Type (biology)","level":2,"score":0.3156999945640564},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.3073999881744385},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.30390000343322754},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.30149999260902405},{"id":"https://openalex.org/C117765406","wikidata":"https://www.wikidata.org/wiki/Q5362437","display_name":"Generalization error","level":3,"score":0.3012000024318695},{"id":"https://openalex.org/C52370388","wikidata":"https://www.wikidata.org/wiki/Q752532","display_name":"Regular language","level":3,"score":0.30000001192092896},{"id":"https://openalex.org/C24858836","wikidata":"https://www.wikidata.org/wiki/Q844718","display_name":"Theory of computation","level":2,"score":0.2922999858856201},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.2727000117301941},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.26179999113082886},{"id":"https://openalex.org/C311688","wikidata":"https://www.wikidata.org/wiki/Q2393193","display_name":"Time complexity","level":2,"score":0.25450000166893005}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.26035","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26035","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.26035","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26035","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Length":[0],"generalization":[1],"remains":[2],"a":[3,28,49,57],"persistent":[4],"challenge":[5],"for":[6,32,42],"neural":[7],"networks:":[8],"recurrent":[9,108],"models":[10],"tend":[11],"to":[12,63],"suffer":[13],"from":[14],"positional":[15],"biases,":[16],"while":[17],"transformers":[18],"are":[19],"constrained":[20],"by":[21],"fixed":[22],"computational":[23],"depth.":[24],"Regular":[25],"languages":[26,118],"provide":[27],"frequently":[29],"used":[30],"testbed":[31],"evaluating":[33],"length":[34],"generalization,":[35],"as":[36],"label":[37],"prediction":[38],"can":[39],"be":[40],"checked":[41],"any":[43],"sequence":[44],"length.":[45],"We":[46,69,112],"propose":[47],"MLP-LDRU,":[48],"type":[50],"of":[51,59,77],"Log-Depth":[52],"Recurrent":[53],"Unit,":[54],"which":[55],"captures":[56],"class":[58],"associativity-biased":[60],"operators":[61],"designed":[62],"approximate":[64],"recurrence":[65],"through":[66],"parallel":[67],"reduction.":[68],"evaluate":[70,114],"MLP-LDRU":[71,115],"on":[72,90,97,119],"21":[73],"regular-language":[74],"tasks,":[75],"consisting":[76],"standard":[78],"benchmarks":[79],"and":[80,93,109,121],"new":[81],"prefix":[82],"languages,":[83],"where":[84,125],"it":[85,126],"achieves":[86],"100%":[87],"out-of-distribution":[88],"accuracy":[89],"18":[91],"tasks":[92],"at":[94],"least":[95],"99.9%":[96],"the":[98],"remaining":[99],"3":[100],"when":[101],"increasing":[102],"max":[103],"training":[104],"length,":[105],"outperforming":[106],"comparable":[107],"attention-based":[110],"models.":[111],"further":[113],"beyond":[116],"regular":[117],"ListOps":[120],"NLP":[122],"classification":[123],"benchmarks,":[124],"performs":[127],"competitively.":[128]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-27T00:00:00"}
