{"id":"https://openalex.org/W7131432429","doi":"https://doi.org/10.48550/arxiv.2602.19733","title":"Understanding the Curse of Unrolling","display_name":"Understanding the Curse of Unrolling","publication_year":2026,"publication_date":"2026-02-23","ids":{"openalex":"https://openalex.org/W7131432429","doi":"https://doi.org/10.48550/arxiv.2602.19733"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.19733","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19733","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.19733","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000059907","display_name":"Sheheryar Mehmood","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Mehmood, Sheheryar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002093701","display_name":"Florian Kn\u00f6ll","orcid":"https://orcid.org/0000-0001-5357-8656"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Knoll, Florian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126803939","display_name":"Peter Ochs","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ochs, Peter","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5000059907"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.7670000195503235,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.7670000195503235,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.03689999878406525,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.03550000116229057,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/iterated-function","display_name":"Iterated function","score":0.6391000151634216},{"id":"https://openalex.org/keywords/hyperparameter","display_name":"Hyperparameter","score":0.5278000235557556},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.5170000195503235},{"id":"https://openalex.org/keywords/loop-unrolling","display_name":"Loop unrolling","score":0.477400004863739},{"id":"https://openalex.org/keywords/curse","display_name":"Curse","score":0.4668000042438507},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.4242999851703644},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4189000129699707},{"id":"https://openalex.org/keywords/phenomenon","display_name":"Phenomenon","score":0.37610000371932983}],"concepts":[{"id":"https://openalex.org/C140479938","wikidata":"https://www.wikidata.org/wiki/Q5254619","display_name":"Iterated function","level":2,"score":0.6391000151634216},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6358000040054321},{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.5278000235557556},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.5170000195503235},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4812999963760376},{"id":"https://openalex.org/C76970557","wikidata":"https://www.wikidata.org/wiki/Q1869750","display_name":"Loop unrolling","level":3,"score":0.477400004863739},{"id":"https://openalex.org/C2780273121","wikidata":"https://www.wikidata.org/wiki/Q109411","display_name":"Curse","level":2,"score":0.4668000042438507},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.4242999851703644},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4189000129699707},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4090000092983246},{"id":"https://openalex.org/C50335755","wikidata":"https://www.wikidata.org/wiki/Q483247","display_name":"Phenomenon","level":2,"score":0.37610000371932983},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.36480000615119934},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.362199991941452},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.34369999170303345},{"id":"https://openalex.org/C527412718","wikidata":"https://www.wikidata.org/wiki/Q855395","display_name":"Interpretation (philosophy)","level":2,"score":0.33889999985694885},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.32690000534057617},{"id":"https://openalex.org/C181789720","wikidata":"https://www.wikidata.org/wiki/Q4812191","display_name":"Asymptotically optimal algorithm","level":2,"score":0.29809999465942383},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2971999943256378},{"id":"https://openalex.org/C136119220","wikidata":"https://www.wikidata.org/wiki/Q1000660","display_name":"Algebra over a field","level":2,"score":0.29089999198913574},{"id":"https://openalex.org/C2779922397","wikidata":"https://www.wikidata.org/wiki/Q5014755","display_name":"CVAR","level":4,"score":0.28349998593330383},{"id":"https://openalex.org/C134121241","wikidata":"https://www.wikidata.org/wiki/Q899301","display_name":"Yield (engineering)","level":2,"score":0.27709999680519104},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.27160000801086426},{"id":"https://openalex.org/C52572940","wikidata":"https://www.wikidata.org/wiki/Q617228","display_name":"Winner's curse","level":3,"score":0.2694000005722046},{"id":"https://openalex.org/C111771559","wikidata":"https://www.wikidata.org/wiki/Q66295","display_name":"Derivative (finance)","level":2,"score":0.2694000005722046},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26589998602867126},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.2644999921321869}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.19733","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19733","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.19733","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19733","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.4411710500717163}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Algorithm":[0],"unrolling":[1,26],"is":[2,27],"ubiquitous":[3],"in":[4,8,106],"machine":[5],"learning,":[6],"particularly":[7],"hyperparameter":[9],"optimization":[10,108],"and":[11,75],"meta-learning,":[12],"where":[13],"Jacobians":[14,33],"of":[15,58,72,89,114],"solution":[16],"mappings":[17],"are":[18,123],"computed":[19],"by":[20,125],"differentiating":[21],"through":[22],"iterative":[23],"algorithms.":[24],"Although":[25],"known":[28,54],"to":[29],"yield":[30],"asymptotically":[31],"correct":[32],"under":[34],"suitable":[35],"conditions,":[36],"recent":[37],"work":[38],"has":[39],"shown":[40],"that":[41,68,80,85,104],"the":[42,49,56,70,77,90,94],"derivative":[43,91],"iterates":[44],"may":[45],"initially":[46],"diverge":[47],"from":[48],"true":[50],"Jacobian,":[51],"a":[52,65,117],"phenomenon":[53],"as":[55],"curse":[57,95],"unrolling.":[59],"In":[60],"this":[61,73],"work,":[62],"we":[63,102],"provide":[64],"non-asymptotic":[66],"analysis":[67],"explains":[69],"origin":[71],"behavior":[74],"identifies":[76],"algorithmic":[78],"factors":[79],"govern":[81],"it.":[82],"We":[83],"show":[84],"truncating":[86],"early":[87],"iterations":[88],"computation":[92],"mitigates":[93],"while":[96],"simultaneously":[97],"reducing":[98],"memory":[99],"requirements.":[100],"Finally,":[101],"demonstrate":[103],"warm-starting":[105],"bilevel":[107],"naturally":[109],"induces":[110],"an":[111],"implicit":[112],"form":[113],"truncation,":[115],"providing":[116],"practical":[118],"remedy.":[119],"Our":[120],"theoretical":[121],"findings":[122],"supported":[124],"numerical":[126],"experiments":[127],"on":[128],"representative":[129],"examples.":[130]},"counts_by_year":[],"updated_date":"2026-02-26T06:34:08.959763","created_date":"2026-02-26T00:00:00"}
