{"id":"https://openalex.org/W7139953340","doi":"https://doi.org/10.48550/arxiv.2603.18126","title":"A Survey of Neural Network Variational Monte Carlo from a Computing Workload Characterization Perspective","display_name":"A Survey of Neural Network Variational Monte Carlo from a Computing Workload Characterization Perspective","publication_year":2026,"publication_date":"2026-03-18","ids":{"openalex":"https://openalex.org/W7139953340","doi":"https://doi.org/10.48550/arxiv.2603.18126"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.18126","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.18126","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.18126","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130253848","display_name":"Zhengze Xiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Xiao, Zhengze","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130243531","display_name":"Xuanzhe Ding","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ding, Xuanzhe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130222548","display_name":"Yuyang Lou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lou, Yuyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130230635","display_name":"Lixue Cheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng, Lixue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5065172226","display_name":"Chaojian Li","orcid":"https://orcid.org/0000-0003-4030-9777"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Chaojian","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5130253848"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11804","display_name":"Quantum many-body systems","score":0.4415000081062317,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11804","display_name":"Quantum many-body systems","score":0.4415000081062317,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.1915999948978424,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.17710000276565552,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6654000282287598},{"id":"https://openalex.org/keywords/monte-carlo-method","display_name":"Monte Carlo method","score":0.6263999938964844},{"id":"https://openalex.org/keywords/workload","display_name":"Workload","score":0.48179998993873596},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.4487000107765198},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.439300000667572},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.39469999074935913},{"id":"https://openalex.org/keywords/distributed-memory","display_name":"Distributed memory","score":0.35580000281333923},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.3433000147342682}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7615000009536743},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6654000282287598},{"id":"https://openalex.org/C19499675","wikidata":"https://www.wikidata.org/wiki/Q232207","display_name":"Monte Carlo method","level":2,"score":0.6263999938964844},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.48179998993873596},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.4487000107765198},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.439300000667572},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4066999852657318},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.39469999074935913},{"id":"https://openalex.org/C91481028","wikidata":"https://www.wikidata.org/wiki/Q1054686","display_name":"Distributed memory","level":3,"score":0.35580000281333923},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3449000120162964},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.3433000147342682},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3379000127315521},{"id":"https://openalex.org/C63320529","wikidata":"https://www.wikidata.org/wiki/Q7269435","display_name":"Quasi-Monte Carlo method","level":5,"score":0.32440000772476196},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3197000026702881},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3158000111579895},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3025999963283539},{"id":"https://openalex.org/C2780841128","wikidata":"https://www.wikidata.org/wiki/Q5073781","display_name":"Characterization (materials science)","level":2,"score":0.29809999465942383},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.28859999775886536},{"id":"https://openalex.org/C46149586","wikidata":"https://www.wikidata.org/wiki/Q11785332","display_name":"Monte Carlo tree search","level":3,"score":0.2874000072479248},{"id":"https://openalex.org/C2778652916","wikidata":"https://www.wikidata.org/wiki/Q7915793","display_name":"Variational Monte Carlo","level":4,"score":0.2858999967575073},{"id":"https://openalex.org/C188045654","wikidata":"https://www.wikidata.org/wiki/Q17148339","display_name":"Memory bandwidth","level":2,"score":0.2858000099658966},{"id":"https://openalex.org/C13153151","wikidata":"https://www.wikidata.org/wiki/Q1639846","display_name":"Hybrid Monte Carlo","level":4,"score":0.28369998931884766},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2734000086784363},{"id":"https://openalex.org/C132725507","wikidata":"https://www.wikidata.org/wiki/Q39879","display_name":"Monte Carlo integration","level":5,"score":0.25940001010894775}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.18126","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.18126","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.18126","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.18126","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Neural":[0],"Network":[1],"Variational":[2],"Monte":[3,20,68],"Carlo":[4,21,69],"(NNVMC)":[5],"has":[6],"emerged":[7],"as":[8],"a":[9,87,104],"promising":[10],"paradigm":[11],"for":[12,163],"solving":[13],"quantum":[14],"many-body":[15],"problems":[16],"by":[17,41,63,138],"combining":[18],"variational":[19],"with":[22,33,54],"expressive":[23],"neural-network":[24],"wave-function":[25,71],"ans\u00e4tze.":[26],"Although":[27],"NNVMC":[28,59,165],"can":[29],"achieve":[30],"competitive":[31],"accuracy":[32],"favorable":[34],"asymptotic":[35],"scaling,":[36],"practical":[37],"deployment":[38],"remains":[39],"limited":[40],"high":[42],"runtime":[43,111],"and":[44,56,73,81,90,101,112,115,125,141,152,172],"memory":[45,113],"cost":[46],"on":[47,155],"modern":[48],"graphics":[49],"processing":[50],"units":[51],"(GPUs).":[52],"Compared":[53],"language":[55],"vision":[57],"workloads,":[58],"execution":[60],"is":[61,135],"shaped":[62],"physics-specific":[64],"stages,":[65],"including":[66,167],"Markov-Chain":[67],"sampling,":[70],"construction,":[72],"derivative/Laplacian":[74],"evaluation,":[75],"which":[76],"produce":[77],"heterogeneous":[78,173],"kernel":[79],"behavior":[80,117],"nontrivial":[82],"bottlenecks.":[83],"This":[84],"paper":[85],"provides":[86],"workload-oriented":[88],"survey":[89],"empirical":[91],"GPU":[92],"characterization":[93],"of":[94],"four":[95],"representative":[96],"ans\u00e4tze:":[97],"PauliNet,":[98],"FermiNet,":[99],"Psiformer,":[100],"Orbformer.":[102],"Using":[103],"unified":[105],"profiling":[106],"protocol,":[107],"we":[108,158],"analyze":[109],"model-level":[110],"trends":[114],"kernel-level":[116],"through":[118],"family":[119],"breakdown,":[120],"arithmetic":[121],"intensity,":[122],"roofline":[123],"positioning,":[124],"hardware":[126],"utilization":[127],"counters.":[128],"The":[129],"results":[130],"show":[131],"that":[132],"end-to-end":[133],"performance":[134],"often":[136],"constrained":[137],"low-intensity":[139],"elementwise":[140],"data-movement":[142],"kernels,":[143],"while":[144],"the":[145],"compute/memory":[146],"balance":[147],"varies":[148],"substantially":[149],"across":[150],"ans\u00e4tze":[151],"stages.":[153],"Based":[154],"these":[156],"findings,":[157],"discuss":[159],"algorithm--hardware":[160],"co-design":[161],"implications":[162],"scalable":[164],"systems,":[166],"phase-aware":[168],"scheduling,":[169],"memory-centric":[170],"optimization,":[171],"acceleration.":[174]},"counts_by_year":[],"updated_date":"2026-03-21T06:36:02.116451","created_date":"2026-03-21T00:00:00"}
