{"id":"https://openalex.org/W7151094260","doi":"https://doi.org/10.48550/arxiv.2604.02969","title":"Inversion-Free Natural Gradient Descent on Riemannian Manifolds","display_name":"Inversion-Free Natural Gradient Descent on Riemannian Manifolds","publication_year":2026,"publication_date":"2026-04-03","ids":{"openalex":"https://openalex.org/W7151094260","doi":"https://doi.org/10.48550/arxiv.2604.02969"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.02969","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.02969","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.02969","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133014801","display_name":"Dario Draca","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Draca, Dario","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061412524","display_name":"Takuo Matsubara","orcid":"https://orcid.org/0000-0003-2177-3056"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Matsubara, Takuo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133043223","display_name":"Minh-Ngoc Tran","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tran, Minh-Ngoc","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9361000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9361000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12056","display_name":"Markov Chains and Monte Carlo Methods","score":0.030899999663233757,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.013399999588727951,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/statistical-manifold","display_name":"Statistical manifold","score":0.7321000099182129},{"id":"https://openalex.org/keywords/information-geometry","display_name":"Information geometry","score":0.7145000100135803},{"id":"https://openalex.org/keywords/riemannian-manifold","display_name":"Riemannian manifold","score":0.5831999778747559},{"id":"https://openalex.org/keywords/geodesic","display_name":"Geodesic","score":0.5817000269889832},{"id":"https://openalex.org/keywords/exponential-map","display_name":"Exponential map (Riemannian geometry)","score":0.5483999848365784},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.5253000259399414},{"id":"https://openalex.org/keywords/manifold","display_name":"Manifold (fluid mechanics)","score":0.4936000108718872},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.4569999873638153},{"id":"https://openalex.org/keywords/fisher-information","display_name":"Fisher information","score":0.44279998540878296},{"id":"https://openalex.org/keywords/positive-definiteness","display_name":"Positive definiteness","score":0.41819998621940613}],"concepts":[{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.843500018119812},{"id":"https://openalex.org/C169391604","wikidata":"https://www.wikidata.org/wiki/Q7604402","display_name":"Statistical manifold","level":5,"score":0.7321000099182129},{"id":"https://openalex.org/C109546454","wikidata":"https://www.wikidata.org/wiki/Q3798604","display_name":"Information geometry","level":4,"score":0.7145000100135803},{"id":"https://openalex.org/C2779593128","wikidata":"https://www.wikidata.org/wiki/Q632814","display_name":"Riemannian manifold","level":2,"score":0.5831999778747559},{"id":"https://openalex.org/C165818556","wikidata":"https://www.wikidata.org/wiki/Q213488","display_name":"Geodesic","level":2,"score":0.5817000269889832},{"id":"https://openalex.org/C102224218","wikidata":"https://www.wikidata.org/wiki/Q25344559","display_name":"Exponential map (Riemannian geometry)","level":5,"score":0.5483999848365784},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.5253000259399414},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.5023999810218811},{"id":"https://openalex.org/C529865628","wikidata":"https://www.wikidata.org/wiki/Q1790740","display_name":"Manifold (fluid mechanics)","level":2,"score":0.4936000108718872},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.4569999873638153},{"id":"https://openalex.org/C29406490","wikidata":"https://www.wikidata.org/wiki/Q1420659","display_name":"Fisher information","level":2,"score":0.44279998540878296},{"id":"https://openalex.org/C2778265155","wikidata":"https://www.wikidata.org/wiki/Q7233276","display_name":"Positive definiteness","level":4,"score":0.41819998621940613},{"id":"https://openalex.org/C57869625","wikidata":"https://www.wikidata.org/wiki/Q1783502","display_name":"Rate of convergence","level":3,"score":0.39800000190734863},{"id":"https://openalex.org/C157157409","wikidata":"https://www.wikidata.org/wiki/Q909601","display_name":"Tangent space","level":2,"score":0.3596999943256378},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.3564999997615814},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.3553999960422516},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.3474999964237213},{"id":"https://openalex.org/C207467116","wikidata":"https://www.wikidata.org/wiki/Q4385666","display_name":"Inverse","level":2,"score":0.34049999713897705},{"id":"https://openalex.org/C47890412","wikidata":"https://www.wikidata.org/wiki/Q1179296","display_name":"Tangent vector","level":3,"score":0.33469998836517334},{"id":"https://openalex.org/C129782007","wikidata":"https://www.wikidata.org/wiki/Q162886","display_name":"Euclidean geometry","level":2,"score":0.3237000107765198},{"id":"https://openalex.org/C2777634741","wikidata":"https://www.wikidata.org/wiki/Q768993","display_name":"Wasserstein metric","level":2,"score":0.323199987411499},{"id":"https://openalex.org/C152442038","wikidata":"https://www.wikidata.org/wiki/Q2778212","display_name":"Tikhonov regularization","level":3,"score":0.3197999894618988},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.31619998812675476},{"id":"https://openalex.org/C151201525","wikidata":"https://www.wikidata.org/wiki/Q177239","display_name":"Limit (mathematics)","level":2,"score":0.30720001459121704},{"id":"https://openalex.org/C203616005","wikidata":"https://www.wikidata.org/wiki/Q620495","display_name":"Hessian matrix","level":2,"score":0.2978000044822693},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.29750001430511475},{"id":"https://openalex.org/C138187205","wikidata":"https://www.wikidata.org/wiki/Q131251","display_name":"Tangent","level":2,"score":0.2962000072002411},{"id":"https://openalex.org/C82668687","wikidata":"https://www.wikidata.org/wiki/Q3046456","display_name":"Earth mover's distance","level":2,"score":0.2757999897003174},{"id":"https://openalex.org/C120174047","wikidata":"https://www.wikidata.org/wiki/Q847073","display_name":"Euclidean distance","level":2,"score":0.2750999927520752},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.26669999957084656},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.2651999890804291},{"id":"https://openalex.org/C64812099","wikidata":"https://www.wikidata.org/wiki/Q176604","display_name":"Random matrix","level":3,"score":0.2621999979019165},{"id":"https://openalex.org/C2777630202","wikidata":"https://www.wikidata.org/wiki/Q5527840","display_name":"Gaussian measure","level":3,"score":0.2612999975681305},{"id":"https://openalex.org/C181104567","wikidata":"https://www.wikidata.org/wiki/Q761383","display_name":"Riemannian geometry","level":2,"score":0.2549000084400177}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.02969","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.02969","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.02969","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.02969","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"natural":[1,48,71],"gradient":[2,49],"method":[3,50,161],"is":[4,15,89,100,108,149],"a":[5,21,92,135],"central":[6],"tool":[7],"for":[8,51,69,129,138,152],"statistical":[9,52,62],"optimisation,":[10],"but":[11],"its":[12,39],"broader":[13],"application":[14],"hindered":[16],"by":[17],"the":[18,25,29,35,70,76,82,96,104,130,139,157,166,172],"assumption":[19],"of":[20,28,38,73,78,84,95,124,132,159],"Euclidean":[22],"parameter":[23,74],"space,":[24],"repeated":[26],"estimation":[27],"Fisher":[30],"information":[31],"matrix":[32,117],"(FIM),":[33],"and":[34,81,134,175],"computational":[36],"cost":[37],"subsequent":[40],"inversion.":[41],"This":[42,106],"paper":[43],"proposes":[44],"an":[45],"intrinsic,":[46],"inversion-free":[47],"models":[53],"whose":[54],"parameters":[55],"lie":[56],"on":[57,91,103,162,171],"general":[58],"Riemannian":[59],"manifolds.":[60],"Formulating":[61],"optimisation":[63],"in":[64],"this":[65],"non-Euclidean":[66],"setting":[67],"allows":[68],"enforcement":[72],"constraints,":[75],"elimination":[77],"non-identifiable":[79],"parameters,":[80],"exploitation":[83],"geodesic":[85],"convexity.":[86],"Our":[87],"algorithm":[88],"based":[90],"moving":[93],"approximation":[94,107],"inverse":[97],"FIM,":[98],"which":[99],"maintained":[101],"directly":[102],"manifold.":[105],"efficiently":[109],"updated":[110],"with":[111,145],"new":[112],"score":[113],"vectors":[114],"using":[115],"low-rank":[116],"identities.":[118],"We":[119,155],"prove":[120],"almost-sure":[121],"convergence":[122],"rates":[123],"$O(\\log":[125],"s":[126],"/":[127],"s^\u03b1)$":[128],"sequence":[131],"iterates,":[133],"similar":[136],"rate":[137],"approximate":[140],"FIM.":[141],"A":[142],"limited-memory":[143],"variant":[144],"sub-quadratic":[146],"storage":[147],"complexity":[148],"further":[150],"proposed":[151],"large-scale":[153],"applications.":[154],"demonstrate":[156],"efficacy":[158],"our":[160],"variational":[163],"Bayes":[164],"within":[165],"Bures-Wasserstein":[167],"manifold,":[168,174],"normalising":[169],"flows":[170],"Stiefel":[173],"reduced-rank":[176],"logistic":[177],"regression.":[178]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-07T00:00:00"}
