{"id":"https://openalex.org/W7133349887","doi":"https://doi.org/10.48550/arxiv.2603.01047","title":"Evaluating GFlowNet from partial episodes for stable and flexible policy-based training","display_name":"Evaluating GFlowNet from partial episodes for stable and flexible policy-based training","publication_year":2026,"publication_date":"2026-03-01","ids":{"openalex":"https://openalex.org/W7133349887","doi":"https://doi.org/10.48550/arxiv.2603.01047"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.01047","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01047","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.01047","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5127900570","display_name":"Puhua Niu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Niu, Puhua","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128008670","display_name":"Shili Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Shili","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5073946580","display_name":"Xiaoning Qian","orcid":"https://orcid.org/0000-0002-4347-2476"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qian, Xiaoning","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5127900570"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.5214999914169312,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.5214999914169312,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.11620000004768372,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.053700000047683716,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.7282000184059143},{"id":"https://openalex.org/keywords/divergence","display_name":"Divergence (linguistics)","score":0.7027000188827515},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5622000098228455},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.531499981880188},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.483599990606308},{"id":"https://openalex.org/keywords/parameterized-complexity","display_name":"Parameterized complexity","score":0.47859999537467957},{"id":"https://openalex.org/keywords/balance","display_name":"Balance (ability)","score":0.46459999680519104},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.39089998602867126}],"concepts":[{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.7282000184059143},{"id":"https://openalex.org/C207390915","wikidata":"https://www.wikidata.org/wiki/Q1230525","display_name":"Divergence (linguistics)","level":2,"score":0.7027000188827515},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5889000296592712},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5622000098228455},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.531499981880188},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.483599990606308},{"id":"https://openalex.org/C165464430","wikidata":"https://www.wikidata.org/wiki/Q1570441","display_name":"Parameterized complexity","level":2,"score":0.47859999537467957},{"id":"https://openalex.org/C168031717","wikidata":"https://www.wikidata.org/wiki/Q1530280","display_name":"Balance (ability)","level":2,"score":0.46459999680519104},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41339999437332153},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.39089998602867126},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38609999418258667},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.36239999532699585},{"id":"https://openalex.org/C74197172","wikidata":"https://www.wikidata.org/wiki/Q1195339","display_name":"Directed acyclic graph","level":2,"score":0.35409998893737793},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.35260000824928284},{"id":"https://openalex.org/C38349280","wikidata":"https://www.wikidata.org/wiki/Q1434290","display_name":"Flow (mathematics)","level":2,"score":0.3434999883174896},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.328900009393692},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.3034999966621399},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.3012999892234802},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.26969999074935913},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.2694999873638153},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.2612999975681305},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.2531000077724457}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.01047","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01047","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.01047","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01047","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.4025932550430298,"id":"https://metadata.un.org/sdg/17","display_name":"Partnerships for the goals"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Generative":[0],"Flow":[1],"Networks":[2],"(GFlowNets)":[3],"were":[4],"developed":[5],"to":[6,33],"learn":[7],"policies":[8,150],"for":[9,118],"efficiently":[10],"sampling":[11],"combinatorial":[12],"candidates":[13],"by":[14,93,145],"interpreting":[15],"their":[16],"generative":[17],"processes":[18],"as":[19],"trajectories":[20],"in":[21],"directed":[22,80],"acyclic":[23,81],"graphs.":[24],"In":[25],"the":[26,30,35,41,44,48,52,66,71,77,90,106,120,135,153],"value-based":[27],"training":[28,139],"workflow,":[29],"objective":[31,112],"is":[32,116],"enforce":[34],"balance":[36,97,111,131],"over":[37,113],"partial":[38,114],"episodes":[39,115],"between":[40,64],"flows":[42,50],"of":[43,51,76,137,155],"learned":[45],"policy":[46,57,67,102],"and":[47,69,108,127,151],"estimated":[49],"desired":[53],"policy,":[54,72],"implicitly":[55],"encouraging":[56],"divergence":[58,68,78],"minimization.":[59],"The":[60],"policy-based":[61,138],"strategy":[62],"alternates":[63],"estimating":[65],"updating":[70],"but":[73,140],"reliable":[74],"estimation":[75],"under":[79],"graphs":[82],"remains":[83],"a":[84,100],"major":[85],"challenge.":[86],"This":[87],"work":[88],"bridges":[89],"two":[91],"perspectives":[92],"showing":[94],"that":[95,104],"flow":[96],"also":[98,141],"yields":[99],"principled":[101],"evaluator":[103],"measures":[105],"divergence,":[107],"an":[109],"evaluation":[110,130],"proposed":[117],"learning":[119],"evaluator.":[121],"As":[122],"demonstrated":[123],"on":[124],"both":[125],"synthetic":[126],"real-world":[128],"tasks,":[129],"not":[132],"only":[133],"strengthens":[134],"reliability":[136],"broadens":[142],"its":[143],"flexibility":[144],"seamlessly":[146],"supporting":[147],"parameterized":[148],"backward":[149],"enabling":[152],"integration":[154],"offline":[156],"data-collection":[157],"techniques.":[158]},"counts_by_year":[],"updated_date":"2026-03-04T07:09:34.246503","created_date":"2026-03-04T00:00:00"}
