{"id":"https://openalex.org/W4391670448","doi":"https://doi.org/10.48550/arxiv.2402.05098","title":"Improved off-policy training of diffusion samplers","display_name":"Improved off-policy training of diffusion samplers","publication_year":2024,"publication_date":"2024-02-07","ids":{"openalex":"https://openalex.org/W4391670448","doi":"https://doi.org/10.48550/arxiv.2402.05098"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2402.05098","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.05098","pdf_url":"https://arxiv.org/pdf/2402.05098","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2402.05098","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023066991","display_name":"Marcin Sendera","orcid":"https://orcid.org/0000-0002-8741-6919"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Sendera, Marcin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100343642","display_name":"Minsu Kim","orcid":"https://orcid.org/0000-0003-4472-0926"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Minsu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020059055","display_name":"Sarthak Mittal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mittal, Sarthak","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023596257","display_name":"Pablo Lemos","orcid":"https://orcid.org/0000-0002-4728-8473"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lemos, Pablo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090728849","display_name":"Luca Scimeca","orcid":"https://orcid.org/0000-0002-2821-0072"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Scimeca, Luca","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041633236","display_name":"Jarrid Rector-Brooks","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rector-Brooks, Jarrid","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039845061","display_name":"Alexandre Adam","orcid":"https://orcid.org/0000-0001-8806-7936"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Adam, Alexandre","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086198262","display_name":"Yoshua Bengio","orcid":"https://orcid.org/0000-0002-9322-3515"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bengio, Yoshua","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5068089852","display_name":"Nikolay Malkin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Malkin, Nikolay","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5023066991"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12100","display_name":"Advanced Mathematical Modeling in Engineering","score":0.9225000143051147,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12100","display_name":"Advanced Mathematical Modeling in Engineering","score":0.9225000143051147,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9204000234603882,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9160000085830688,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.8090179562568665},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6989307999610901},{"id":"https://openalex.org/keywords/amortized-analysis","display_name":"Amortized analysis","score":0.5518256425857544},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5301347970962524},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.5087535977363586},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4584678113460541},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.34571659564971924},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.20382237434387207},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.1930864453315735},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.1587877869606018},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.07875320315361023},{"id":"https://openalex.org/keywords/marketing","display_name":"Marketing","score":0.061791688203811646}],"concepts":[{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.8090179562568665},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6989307999610901},{"id":"https://openalex.org/C142417499","wikidata":"https://www.wikidata.org/wiki/Q331716","display_name":"Amortized analysis","level":3,"score":0.5518256425857544},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5301347970962524},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.5087535977363586},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4584678113460541},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.34571659564971924},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.20382237434387207},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1930864453315735},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.1587877869606018},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.07875320315361023},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.061791688203811646},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"pmh:oai:arXiv.org:2402.05098","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.05098","pdf_url":"https://arxiv.org/pdf/2402.05098","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:pure.ed.ac.uk:openaire/564a53c9-6e61-4737-ac1a-f3aadd15682c","is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/files/476340745/SenderaEtalNeurIPS2024ImprovedOffPolicyTraining_accepted_vers_con_contrib_.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Sendera, M, Kim, M, Mittal, S, Lemos, P, Scimeca, L, Rector-Brooks, J, Adam, A, Bengio, Y & Malkin, N 2024, Improved off-policy training of diffusion samplers. in A Globerson, L Mackey, D Belgrave, A Fan, U Paquet, J Tomczak & C Zhang (eds), Advances in Neural Information Processing Systems 37 (NeurIPS 2024) Main Conference Track. Advances in Neural Information Processing Systems, pp. 1-30, The Thirty-Eighth Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, 10/12/24. https://doi.org/10.48550/arXiv.2402.05098","raw_type":"contributionToPeriodical"},{"id":"pmh:oai:pure.ed.ac.uk:publications/564a53c9-6e61-4737-ac1a-f3aadd15682c","is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/564a53c9-6e61-4737-ac1a-f3aadd15682c","pdf_url":null,"source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Sendera, M, Kim, M, Mittal, S, Lemos, P, Scimeca, L, Rector-Brooks, J, Adam, A, Bengio, Y & Malkin, N 2024, Improved off-policy training of diffusion samplers. in A Globerson, L Mackey, D Belgrave, A Fan, U Paquet, J Tomczak & C Zhang (eds), Advances in Neural Information Processing Systems 37 (NeurIPS 2024) Main Conference Track. Advances in Neural Information Processing Systems, pp. 1-30, The Thirty-Eighth Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, 10/12/24. https://doi.org/10.48550/arXiv.2402.05098","raw_type":"contributionToPeriodical"},{"id":"doi:10.48550/arxiv.2402.05098","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2402.05098","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2402.05098","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.05098","pdf_url":"https://arxiv.org/pdf/2402.05098","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2165548363","display_name":null,"funder_award_id":"Canada","funder_id":"https://openalex.org/F4320334593","funder_display_name":"Natural Sciences and Engineering Research Council of Canada"}],"funders":[{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"},{"id":"https://openalex.org/F4320309949","display_name":"Canadian Institute for Advanced Research","ror":"https://ror.org/01sdtdd95"},{"id":"https://openalex.org/F4320322650","display_name":"Narodowym Centrum Nauki","ror":"https://ror.org/03ha2q922"},{"id":"https://openalex.org/F4320331257","display_name":"Alliance de recherche num\u00e9rique du Canada","ror":"https://ror.org/010r6td27"},{"id":"https://openalex.org/F4320332195","display_name":"Samsung","ror":"https://ror.org/04w3jy968"},{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4391670448.pdf","grobid_xml":"https://content.openalex.org/works/W4391670448.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4238897586","https://openalex.org/W435179959","https://openalex.org/W2619091065","https://openalex.org/W2059640416","https://openalex.org/W1490753184","https://openalex.org/W2284465472","https://openalex.org/W2291782699","https://openalex.org/W1993948687","https://openalex.org/W2011676020","https://openalex.org/W2141466631"],"abstract_inverted_index":{"We":[0,21,58],"study":[1],"the":[2,43,73,77,88,101],"problem":[3],"of":[4,46,79,90,95],"training":[5],"diffusion":[6,119],"models":[7,120],"to":[8],"sample":[9],"from":[10,55],"a":[11,14,61,80,93,113],"distribution":[12],"with":[13,76],"given":[15],"unnormalized":[16],"density":[17],"or":[18],"energy":[19],"function.":[20],"benchmark":[22],"several":[23],"diffusion-structured":[24],"inference":[25],"methods,":[26,67],"including":[27],"simulation-based":[28],"variational":[29],"approaches":[30],"and":[31,83,104],"off-policy":[32,66],"methods":[33,103],"(continuous":[34],"generative":[35],"flow":[36],"networks).":[37],"Our":[38,98],"results":[39],"shed":[40],"light":[41],"on":[42,69,92,118],"relative":[44],"advantages":[45],"existing":[47],"algorithms":[48],"while":[49],"bringing":[50],"into":[51],"question":[52],"some":[53],"claims":[54],"past":[56],"work.":[57],"also":[59],"propose":[60],"novel":[62],"exploration":[63],"strategy":[64],"for":[65,100,115,121],"based":[68],"local":[70],"search":[71],"in":[72],"target":[74,96],"space":[75],"use":[78],"replay":[81],"buffer,":[82],"show":[84],"that":[85],"it":[86],"improves":[87],"quality":[89],"samples":[91],"variety":[94],"distributions.":[97],"code":[99],"sampling":[102],"benchmarks":[105],"studied":[106],"is":[107],"made":[108],"public":[109],"at":[110],"https://github.com/GFNOrg/gfn-diffusion":[111],"as":[112],"base":[114],"future":[116],"work":[117],"amortized":[122],"inference.":[123]},"counts_by_year":[],"updated_date":"2026-04-11T08:14:18.477133","created_date":"2024-02-09T00:00:00"}
