{"id":"https://openalex.org/W7160634767","doi":"https://doi.org/10.48550/arxiv.2605.06563","title":"Criticality and Saturation in Orthogonal Neural Networks","display_name":"Criticality and Saturation in Orthogonal Neural Networks","publication_year":2026,"publication_date":"2026-05-07","ids":{"openalex":"https://openalex.org/W7160634767","doi":"https://doi.org/10.48550/arxiv.2605.06563"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.06563","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06563","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.06563","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073082430","display_name":"Max Guillen","orcid":"https://orcid.org/0000-0001-5442-8780"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guillen, Max","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135709047","display_name":"Jan E. Gerken","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gerken, Jan E.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.5178999900817871,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.5178999900817871,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.10849999636411667,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11804","display_name":"Quantum many-body systems","score":0.054099999368190765,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/recursion","display_name":"Recursion (computer science)","score":0.7135000228881836},{"id":"https://openalex.org/keywords/criticality","display_name":"Criticality","score":0.5461999773979187},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.5385000109672546},{"id":"https://openalex.org/keywords/nonlinear-system","display_name":"Nonlinear system","score":0.5108000040054321},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.49880000948905945},{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.48489999771118164},{"id":"https://openalex.org/keywords/series","display_name":"Series (stratigraphy)","score":0.4553999900817871},{"id":"https://openalex.org/keywords/orthogonal-polynomials","display_name":"Orthogonal polynomials","score":0.4104999899864197},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.37059998512268066}],"concepts":[{"id":"https://openalex.org/C168773036","wikidata":"https://www.wikidata.org/wiki/Q264164","display_name":"Recursion (computer science)","level":2,"score":0.7135000228881836},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.6244000196456909},{"id":"https://openalex.org/C125611927","wikidata":"https://www.wikidata.org/wiki/Q17008131","display_name":"Criticality","level":2,"score":0.5461999773979187},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.5385000109672546},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.5108000040054321},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.49880000948905945},{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.48489999771118164},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.475600004196167},{"id":"https://openalex.org/C143724316","wikidata":"https://www.wikidata.org/wiki/Q312468","display_name":"Series (stratigraphy)","level":2,"score":0.4553999900817871},{"id":"https://openalex.org/C121864883","wikidata":"https://www.wikidata.org/wiki/Q677916","display_name":"Statistical physics","level":1,"score":0.42660000920295715},{"id":"https://openalex.org/C10628310","wikidata":"https://www.wikidata.org/wiki/Q619458","display_name":"Orthogonal polynomials","level":2,"score":0.4104999899864197},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.37059998512268066},{"id":"https://openalex.org/C65574998","wikidata":"https://www.wikidata.org/wiki/Q386272","display_name":"Feynman diagram","level":2,"score":0.3684000074863434},{"id":"https://openalex.org/C186080144","wikidata":"https://www.wikidata.org/wiki/Q358733","display_name":"Series expansion","level":2,"score":0.3264000117778778},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.3188000023365021},{"id":"https://openalex.org/C2778029271","wikidata":"https://www.wikidata.org/wiki/Q5421931","display_name":"Extension (predicate logic)","level":2,"score":0.3041999936103821},{"id":"https://openalex.org/C176321772","wikidata":"https://www.wikidata.org/wiki/Q1430640","display_name":"Numerical stability","level":3,"score":0.29980000853538513},{"id":"https://openalex.org/C73905626","wikidata":"https://www.wikidata.org/wiki/Q206925","display_name":"Power series","level":2,"score":0.2962999939918518},{"id":"https://openalex.org/C143170015","wikidata":"https://www.wikidata.org/wiki/Q17007850","display_name":"Stability conditions","level":3,"score":0.2955999970436096},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.28060001134872437},{"id":"https://openalex.org/C61445026","wikidata":"https://www.wikidata.org/wiki/Q217608","display_name":"Fixed point","level":2,"score":0.2784000039100647},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.2782000005245209},{"id":"https://openalex.org/C9930424","wikidata":"https://www.wikidata.org/wiki/Q7426587","display_name":"Saturation (graph theory)","level":2,"score":0.27570000290870667},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.263700008392334},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.2606000006198883},{"id":"https://openalex.org/C92207270","wikidata":"https://www.wikidata.org/wiki/Q939253","display_name":"Matrix norm","level":3,"score":0.2554999887943268}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.06563","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06563","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.06563","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06563","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"It":[0],"has":[1],"been":[2],"known":[3],"for":[4,63,83,110,144,158],"a":[5,40,155,172],"long":[6],"time":[7],"that":[8,55,129,186],"initializing":[9],"weight":[10],"matrices":[11],"to":[12,68,120],"be":[13,28],"orthogonal":[14,99,169],"instead":[15],"of":[16,71,91,98,106,137,161,164,189],"having":[17],"i.i.d.":[18],"Gaussian":[19],"components":[20],"can":[21,27],"improve":[22],"training":[23],"performance.":[24],"This":[25,151],"phenomenon":[26],"analyzed":[29],"using":[30],"finite-width":[31,89,139],"corrections,":[32],"where":[33],"the":[34,56,69,84,88,92,96,111,115,130,135,138,159,176],"infinite-width":[35],"statistics":[36,94],"are":[37,118],"supplemented":[38],"by":[39,50,184],"power":[41],"series":[42],"in":[43,59,87,95,114,123,175],"$1/\\mathrm{width}$.":[44,124],"In":[45,74],"particular,":[46],"recent":[47],"empirical":[48],"results":[49,182],"Day":[51],"et":[52],"al.":[53],"show":[54,127],"tensors":[57,70,85,140],"appearing":[58,86],"this":[60,75],"treatment":[61],"stabilize":[62],"large":[64],"depth,":[65],"as":[66],"opposed":[67],"i.i.d.-initialized":[72],"networks.":[73],"article,":[76],"we":[77,126,132],"derive":[78,133],"explicit":[79],"layer-wise":[80],"recursion":[81,191],"relations":[82,192],"expansion":[90],"network":[93,204],"case":[97],"initializations.":[100],"We":[101,178],"also":[102],"provide":[103],"an":[104],"extension":[105],"recently-introduced":[107],"Feynman":[108],"diagrams":[109],"corresponding":[112],"recursions":[113,131],"i.i.d.-case":[116],"which":[117,141],"valid":[119],"all":[121],"orders":[122],"Finally,":[125],"explicitly":[128],"reproduce":[134],"stability":[136,160],"was":[142],"observed":[143],"activation":[145],"functions":[146],"with":[147,168,200],"vanishing":[148],"fixed":[149],"point.":[150],"work":[152],"therefore":[153],"provides":[154],"theoretical":[156,181],"explanation":[157],"nonlinear":[162],"networks":[163],"finite":[165],"width":[166],"initialized":[167],"weights,":[170],"closing":[171],"long-standing":[173],"gap":[174],"literature.":[177],"validate":[179],"our":[180,190],"experimentally":[183],"showing":[185],"numerical":[187],"solutions":[188],"and":[193],"their":[194],"analytical":[195],"large-depth":[196],"expansions":[197],"agree":[198],"excellently":[199],"Monte-Carlo":[201],"estimates":[202],"from":[203],"ensembles.":[205]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-09T00:00:00"}
