{"id":"https://openalex.org/W7158220680","doi":"https://doi.org/10.48550/arxiv.2604.25904","title":"Teacher Forcing as Generalized Bayes: Optimization Geometry Mismatch in Switching Surrogates for Chaotic Dynamics","display_name":"Teacher Forcing as Generalized Bayes: Optimization Geometry Mismatch in Switching Surrogates for Chaotic Dynamics","publication_year":2026,"publication_date":"2026-04-28","ids":{"openalex":"https://openalex.org/W7158220680","doi":"https://doi.org/10.48550/arxiv.2604.25904"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.25904","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.25904","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.25904","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134855966","display_name":"Andre Herz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Herz, Andre","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056788018","display_name":"Daniel Durstewitz","orcid":"https://orcid.org/0000-0002-9340-3786"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Durstewitz, Daniel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5012894482","display_name":"Georgia Koppe","orcid":"https://orcid.org/0000-0003-2941-9238"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koppe, Georgia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.33719998598098755,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.33719998598098755,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.1152999997138977,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11804","display_name":"Quantum many-body systems","score":0.11209999769926071,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/forcing","display_name":"Forcing (mathematics)","score":0.7868000268936157},{"id":"https://openalex.org/keywords/chaotic","display_name":"Chaotic","score":0.7159000039100647},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.6262999773025513},{"id":"https://openalex.org/keywords/curvature","display_name":"Curvature","score":0.5246000289916992},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.4571000039577484},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.4293000102043152},{"id":"https://openalex.org/keywords/dynamical-systems-theory","display_name":"Dynamical systems theory","score":0.4088999927043915},{"id":"https://openalex.org/keywords/bayes-theorem","display_name":"Bayes' theorem","score":0.3853999972343445},{"id":"https://openalex.org/keywords/dynamical-system","display_name":"Dynamical system (definition)","score":0.3736000061035156}],"concepts":[{"id":"https://openalex.org/C197115733","wikidata":"https://www.wikidata.org/wiki/Q1003136","display_name":"Forcing (mathematics)","level":2,"score":0.7868000268936157},{"id":"https://openalex.org/C2777052490","wikidata":"https://www.wikidata.org/wiki/Q5072826","display_name":"Chaotic","level":2,"score":0.7159000039100647},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.6308000087738037},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.6262999773025513},{"id":"https://openalex.org/C195065555","wikidata":"https://www.wikidata.org/wiki/Q214881","display_name":"Curvature","level":2,"score":0.5246000289916992},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.4571000039577484},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.4293000102043152},{"id":"https://openalex.org/C79379906","wikidata":"https://www.wikidata.org/wiki/Q3174497","display_name":"Dynamical systems theory","level":2,"score":0.4088999927043915},{"id":"https://openalex.org/C207201462","wikidata":"https://www.wikidata.org/wiki/Q182505","display_name":"Bayes' theorem","level":3,"score":0.3853999972343445},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.3750999867916107},{"id":"https://openalex.org/C33962884","wikidata":"https://www.wikidata.org/wiki/Q378637","display_name":"Dynamical system (definition)","level":3,"score":0.3736000061035156},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3617999851703644},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.32710000872612},{"id":"https://openalex.org/C109546454","wikidata":"https://www.wikidata.org/wiki/Q3798604","display_name":"Information geometry","level":4,"score":0.32409998774528503},{"id":"https://openalex.org/C2780713532","wikidata":"https://www.wikidata.org/wiki/Q93158","display_name":"Edge of chaos","level":2,"score":0.3075000047683716},{"id":"https://openalex.org/C49781872","wikidata":"https://www.wikidata.org/wiki/Q1045555","display_name":"Maximum likelihood","level":2,"score":0.3021000027656555},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.30090001225471497},{"id":"https://openalex.org/C121864883","wikidata":"https://www.wikidata.org/wiki/Q677916","display_name":"Statistical physics","level":1,"score":0.298799991607666},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.29760000109672546},{"id":"https://openalex.org/C95923904","wikidata":"https://www.wikidata.org/wiki/Q6760420","display_name":"Marginal likelihood","level":3,"score":0.2946999967098236},{"id":"https://openalex.org/C2776799497","wikidata":"https://www.wikidata.org/wiki/Q484298","display_name":"Surface (topology)","level":2,"score":0.29409998655319214},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.29260000586509705},{"id":"https://openalex.org/C2987469083","wikidata":"https://www.wikidata.org/wiki/Q166314","display_name":"Chaotic systems","level":3,"score":0.2824000120162964},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.27399998903274536},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.2689000070095062},{"id":"https://openalex.org/C29406490","wikidata":"https://www.wikidata.org/wiki/Q1420659","display_name":"Fisher information","level":2,"score":0.26739999651908875},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.2515999972820282}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.25904","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.25904","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.25904","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.25904","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5134584903717041}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Identity":[0],"teacher":[1,47],"forcing":[2,48],"(ITF)":[3],"enables":[4],"stable":[5],"training":[6],"of":[7,63,73,130],"deterministic":[8],"recurrent":[9,26],"surrogates":[10],"for":[11,20],"chaotic":[12],"dynamical":[13,21,128],"systems":[14,22],"and":[15,65],"has":[16],"been":[17],"highly":[18],"effective":[19],"reconstruction":[23],"(DSR)":[24],"with":[25],"neural":[27],"networks":[28],"(RNNs),":[29],"including":[30],"interpretable":[31],"almost-linear":[32],"RNNs":[33],"(AL-RNNs).":[34],"However,":[35],"as":[36],"an":[37],"intervention-based":[38],"prediction":[39],"loss":[40],"(and":[41],"thus":[42],"a":[43,69,90,107],"generalized":[44],"Bayes":[45],"update),":[46],"need":[49],"not":[50],"match":[51],"the":[52,60,83],"free-running":[53],"model's":[54],"marginal":[55,66,101],"likelihood":[56,67,102],"geometry.":[57],"We":[58],"compare":[59],"objective-induced":[61],"curvatures":[62],"ITF":[64,96],"in":[68],"probabilistic":[70],"switching":[71,84,112],"augmentation":[72],"AL-RNNs,":[74],"estimating":[75],"ambiguity-aware":[76],"observed":[77],"information":[78],"via":[79],"Louis'":[80],"identity.":[81],"In":[82,116],"setting":[85],"studied":[86],"here,":[87],"conditioning":[88],"on":[89],"single":[91],"forced":[92],"regime":[93],"path":[94],"(as":[95],"does)":[97],"inflates":[98],"curvature,":[99],"while":[100],"curvature":[103],"is":[104],"reduced":[105],"by":[106],"missing-information":[108],"correction":[109],"when":[110],"multiple":[111],"explanations":[113],"remain":[114],"plausible.":[115],"Lorenz-63":[117],"experiments,":[118],"windowed":[119],"evidence":[120,124],"fine-tuning":[121],"improves":[122],"held-out":[123],"but":[125],"can":[126],"degrade":[127],"quantities":[129],"interest":[131],"(QoIs)":[132],"relative":[133],"to":[134],"ITF-pretrained":[135],"models.":[136]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-04-30T00:00:00"}
