{"id":"https://openalex.org/W3027682703","doi":"https://doi.org/10.1007/s10208-020-09460-1","title":"A Neural Network-Based Policy Iteration Algorithm with Global $$H^2$$-Superlinear Convergence for Stochastic Games on Domains","display_name":"A Neural Network-Based Policy Iteration Algorithm with Global $$H^2$$-Superlinear Convergence for Stochastic Games on Domains","publication_year":2020,"publication_date":"2020-05-18","ids":{"openalex":"https://openalex.org/W3027682703","doi":"https://doi.org/10.1007/s10208-020-09460-1","mag":"3027682703"},"language":"en","primary_location":{"id":"doi:10.1007/s10208-020-09460-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10208-020-09460-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10208-020-09460-1.pdf","source":{"id":"https://openalex.org/S151639445","display_name":"Foundations of Computational Mathematics","issn_l":"1615-3375","issn":["1615-3375","1615-3383"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Foundations of Computational Mathematics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10208-020-09460-1.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004826461","display_name":"Kazufumi Ito","orcid":"https://orcid.org/0000-0003-2417-2600"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Kazufumi Ito","raw_affiliation_strings":["Department of Mathematics, North Carolina State University, Raleigh, NC, 27607, USA"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics, North Carolina State University, Raleigh, NC, 27607, USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013285444","display_name":"Christoph Reisinger","orcid":"https://orcid.org/0000-0003-4027-5298"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Christoph Reisinger","raw_affiliation_strings":["Mathematical Institute, University of Oxford, Oxford, OX2 6GG, UK"],"affiliations":[{"raw_affiliation_string":"Mathematical Institute, University of Oxford, Oxford, OX2 6GG, UK","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100324331","display_name":"Yufei Zhang","orcid":"https://orcid.org/0000-0001-9843-1404"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yufei Zhang","raw_affiliation_strings":["Mathematical Institute, University of Oxford, Oxford, OX2 6GG, UK"],"affiliations":[{"raw_affiliation_string":"Mathematical Institute, University of Oxford, Oxford, OX2 6GG, UK","institution_ids":["https://openalex.org/I40120149"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5004826461"],"corresponding_institution_ids":["https://openalex.org/I137902535"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":1.5992,"has_fulltext":true,"cited_by_count":27,"citation_normalized_percentile":{"value":0.83094768,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"21","issue":"2","first_page":"331","last_page":"374"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10360","display_name":"Fluid Dynamics and Turbulent Flows","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10067","display_name":"Stochastic processes and financial applications","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/2003","display_name":"Finance"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.616872251033783},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.59517502784729},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.5235785245895386},{"id":"https://openalex.org/keywords/numerical-analysis","display_name":"Numerical analysis","score":0.5028175711631775},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.47755512595176697},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.4507279098033905},{"id":"https://openalex.org/keywords/ansatz","display_name":"Ansatz","score":0.433530330657959},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.39924219250679016},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3191877007484436},{"id":"https://openalex.org/keywords/mathematical-analysis","display_name":"Mathematical analysis","score":0.2112646996974945},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.08831971883773804}],"concepts":[{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.616872251033783},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.59517502784729},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5235785245895386},{"id":"https://openalex.org/C48753275","wikidata":"https://www.wikidata.org/wiki/Q11216","display_name":"Numerical analysis","level":2,"score":0.5028175711631775},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.47755512595176697},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.4507279098033905},{"id":"https://openalex.org/C130979935","wikidata":"https://www.wikidata.org/wiki/Q568954","display_name":"Ansatz","level":2,"score":0.433530330657959},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.39924219250679016},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3191877007484436},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.2112646996974945},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.08831971883773804},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s10208-020-09460-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10208-020-09460-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10208-020-09460-1.pdf","source":{"id":"https://openalex.org/S151639445","display_name":"Foundations of Computational Mathematics","issn_l":"1615-3375","issn":["1615-3375","1615-3383"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Foundations of Computational Mathematics","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s10208-020-09460-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10208-020-09460-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10208-020-09460-1.pdf","source":{"id":"https://openalex.org/S151639445","display_name":"Foundations of Computational Mathematics","issn_l":"1615-3375","issn":["1615-3375","1615-3383"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Foundations of Computational Mathematics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320290","display_name":"University of Oxford","ror":"https://ror.org/052gg0110"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3027682703.pdf","grobid_xml":"https://content.openalex.org/works/W3027682703.grobid-xml"},"referenced_works_count":51,"referenced_works":["https://openalex.org/W581038412","https://openalex.org/W1492326914","https://openalex.org/W1516903196","https://openalex.org/W1555557982","https://openalex.org/W1586623601","https://openalex.org/W1593542532","https://openalex.org/W1753318419","https://openalex.org/W1866311589","https://openalex.org/W1891592265","https://openalex.org/W1964377184","https://openalex.org/W1970030120","https://openalex.org/W1981493390","https://openalex.org/W2026365342","https://openalex.org/W2027197837","https://openalex.org/W2042154949","https://openalex.org/W2042680115","https://openalex.org/W2047090868","https://openalex.org/W2060171102","https://openalex.org/W2061508005","https://openalex.org/W2066572496","https://openalex.org/W2068328804","https://openalex.org/W2077040879","https://openalex.org/W2087003257","https://openalex.org/W2088299544","https://openalex.org/W2103255584","https://openalex.org/W2121005322","https://openalex.org/W2145348031","https://openalex.org/W2149713433","https://openalex.org/W2158985775","https://openalex.org/W2328013571","https://openalex.org/W2470369492","https://openalex.org/W2588542536","https://openalex.org/W2625995436","https://openalex.org/W2749028154","https://openalex.org/W2760972773","https://openalex.org/W2770250658","https://openalex.org/W2925136200","https://openalex.org/W2945971353","https://openalex.org/W2964121744","https://openalex.org/W2964328368","https://openalex.org/W2982781555","https://openalex.org/W3001199727","https://openalex.org/W3099661895","https://openalex.org/W3101159108","https://openalex.org/W3101260193","https://openalex.org/W3105898488","https://openalex.org/W3106269269","https://openalex.org/W4292166829","https://openalex.org/W4292360407","https://openalex.org/W4302367620","https://openalex.org/W6600474023"],"related_works":["https://openalex.org/W2089909466","https://openalex.org/W2986094430","https://openalex.org/W3208000705","https://openalex.org/W2089799198","https://openalex.org/W2126034343","https://openalex.org/W3193597985","https://openalex.org/W2460950183","https://openalex.org/W3014952517","https://openalex.org/W2032748140","https://openalex.org/W2392523851"],"abstract_inverted_index":{"Abstract":[0],"In":[1],"this":[2,82],"work,":[3],"we":[4,100],"propose":[5],"a":[6,42,53],"class":[7],"of":[8,26,44,148],"numerical":[9,63,108,115],"schemes":[10,116],"for":[11,95],"solving":[12],"semilinear":[13,39],"Hamilton\u2013Jacobi\u2013Bellman\u2013Isaacs":[14],"(HJBI)":[15],"boundary":[16,126],"value":[17,109],"problems":[18,25],"which":[19,48],"arise":[20],"naturally":[21],"from":[22,106],"exit":[23],"time":[24],"diffusion":[27],"processes":[28],"with":[29],"controlled":[30],"drift.":[31],"We":[32,59],"exploit":[33],"policy":[34],"iteration":[35,94],"to":[36,123,138,144],"reduce":[37],"the":[38,62,68,88,96,102,107,131,140,146,149],"problem":[40,135],"into":[41],"sequence":[43],"linear":[45],"Dirichlet":[46],"problems,":[47],"are":[49,120,136],"subsequently":[50],"approximated":[51],"by":[52,86],"multilayer":[54],"feedforward":[55],"neural":[56],"network":[57],"ansatz.":[58],"establish":[60],"that":[61,81],"solutions":[64],"converge":[65],"globally":[66],"in":[67],"$$H^2$$":[69],"<mml:math":[70],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\">":[71],"<mml:msup>":[72],"<mml:mi>H</mml:mi>":[73],"<mml:mn>2</mml:mn>":[74],"</mml:msup>":[75],"</mml:math>":[76],"-norm":[77],"and":[78,111,117,143],"further":[79],"demonstrate":[80,145],"convergence":[83,118],"is":[84],"superlinear,":[85],"interpreting":[87],"algorithm":[89],"as":[90],"an":[91],"inexact":[92],"Newton":[93],"HJBI":[97],"equation.":[98],"Moreover,":[99],"construct":[101],"optimal":[103],"feedback":[104],"controls":[105],"functions":[110],"deduce":[112],"convergence.":[113],"The":[114],"results":[119,142],"then":[121],"extended":[122],"oblique":[124],"derivative":[125],"conditions.":[127],"Numerical":[128],"experiments":[129],"on":[130],"stochastic":[132],"Zermelo":[133],"navigation":[134],"presented":[137],"illustrate":[139],"theoretical":[141],"effectiveness":[147],"method.":[150]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":4}],"updated_date":"2026-04-23T09:07:50.710637","created_date":"2025-10-10T00:00:00"}
