{"id":"https://openalex.org/W4323651335","doi":"https://doi.org/10.48550/arxiv.2303.04137","title":"Diffusion Policy: Visuomotor Policy Learning via Action Diffusion","display_name":"Diffusion Policy: Visuomotor Policy Learning via Action Diffusion","publication_year":2023,"publication_date":"2023-03-07","ids":{"openalex":"https://openalex.org/W4323651335","doi":"https://doi.org/10.48550/arxiv.2303.04137"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2303.04137","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2303.04137","pdf_url":"https://arxiv.org/pdf/2303.04137","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2303.04137","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101510130","display_name":"Cheng Chi","orcid":"https://orcid.org/0000-0001-9143-7125"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chi, Cheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101340675","display_name":"Zhenjia Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Zhenjia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053373302","display_name":"Siyuan Feng","orcid":"https://orcid.org/0000-0003-2531-8480"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feng, Siyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085247461","display_name":"Eric Cousineau","orcid":"https://orcid.org/0000-0002-5056-8046"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cousineau, Eric","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101182304","display_name":"Yilun Du","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Yilun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091048694","display_name":"Benjamin Burchfiel","orcid":"https://orcid.org/0000-0001-7332-6712"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Burchfiel, Benjamin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Tedrake, Russ","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tedrake, Russ","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5004644695","display_name":"Shuran Song","orcid":"https://orcid.org/0000-0002-8768-7356"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Shuran","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5101510130"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":13,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9786999821662903,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9786999821662903,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9743000268936157,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9348000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6844930648803711},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6094998717308044},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5723423361778259},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5640529990196228},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5115031003952026},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4549247622489929},{"id":"https://openalex.org/keywords/diffusion-process","display_name":"Diffusion process","score":0.43447232246398926}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6844930648803711},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6094998717308044},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5723423361778259},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5640529990196228},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5115031003952026},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4549247622489929},{"id":"https://openalex.org/C68710425","wikidata":"https://www.wikidata.org/wiki/Q5275442","display_name":"Diffusion process","level":3,"score":0.43447232246398926},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.0},{"id":"https://openalex.org/C3017618536","wikidata":"https://www.wikidata.org/wiki/Q304994","display_name":"Innovation diffusion","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2303.04137","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2303.04137","pdf_url":"https://arxiv.org/pdf/2303.04137","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2303.04137","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2303.04137","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2303.04137","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2303.04137","pdf_url":"https://arxiv.org/pdf/2303.04137","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.5099999904632568,"id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G2783609121","display_name":null,"funder_award_id":"2037101","funder_id":"https://openalex.org/F4320337391","funder_display_name":"Division of Civil, Mechanical and Manufacturing Innovation"},{"id":"https://openalex.org/G3947485538","display_name":null,"funder_award_id":"CMMI-2037101","funder_id":"https://openalex.org/F4320337391","funder_display_name":"Division of Civil, Mechanical and Manufacturing Innovation"},{"id":"https://openalex.org/G5954070948","display_name":null,"funder_award_id":"CMMI-","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6081519054","display_name":null,"funder_award_id":"2037101","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6852655174","display_name":null,"funder_award_id":"CMMI-2037101","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7360523541","display_name":null,"funder_award_id":"IIS-2132519","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8365859440","display_name":null,"funder_award_id":"2132519","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320315934","display_name":"Toyota Research Institute","ror":null},{"id":"https://openalex.org/F4320337391","display_name":"Division of Civil, Mechanical and Manufacturing Innovation","ror":"https://ror.org/028yd4c30"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4323651335.pdf","grobid_xml":"https://content.openalex.org/works/W4323651335.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W2024136090","https://openalex.org/W2586732548","https://openalex.org/W3049728571","https://openalex.org/W2964765435","https://openalex.org/W2768698792"],"abstract_inverted_index":{"This":[0],"paper":[1,131],"introduces":[2],"Diffusion":[3,26,55],"Policy,":[4],"a":[5,14,19,77,133,160],"new":[6,161],"way":[7],"of":[8,53,60,79,120,135,142,163,177],"generating":[9],"robot":[10,35,46,96],"behavior":[11],"by":[12],"representing":[13],"robot's":[15],"visuomotor":[16,124],"policy":[17,125,164],"as":[18],"conditional":[20],"denoising":[21],"diffusion":[22,88,121,151,178],"process.":[23],"We":[24,84,153],"benchmark":[25],"Policy":[27,56],"across":[28],"12":[29],"different":[30,34],"tasks":[31],"from":[32],"4":[33],"manipulation":[36],"benchmarks":[37],"and":[38,65,110,148,182],"find":[39,85],"that":[40,86,167],"it":[41],"consistently":[42],"outperforms":[43],"existing":[44],"state-of-the-art":[45],"learning":[47,126,165],"methods":[48],"with":[49,68],"an":[50],"average":[51],"improvement":[52],"46.9%.":[54],"learns":[57],"the":[58,61,87,118,140,149,172],"gradient":[59,72],"action-distribution":[62],"score":[63],"function":[64],"iteratively":[66],"optimizes":[67],"respect":[69],"to":[70,170],"this":[71,130,155],"field":[73],"during":[74],"inference":[75],"via":[76],"series":[78],"stochastic":[80],"Langevin":[81],"dynamics":[82],"steps.":[83],"formulation":[89],"yields":[90],"powerful":[91,173],"advantages":[92],"when":[93],"used":[94],"for":[95,106,123],"policies,":[97],"including":[98,139],"gracefully":[99],"handling":[100],"multimodal":[101],"action":[102,108],"distributions,":[103],"being":[104],"suitable":[105],"high-dimensional":[107],"spaces,":[109],"exhibiting":[111],"impressive":[112],"training":[113,183],"stability.":[114],"To":[115],"fully":[116],"unlock":[117],"potential":[119],"models":[122],"on":[127],"physical":[128],"robots,":[129],"presents":[132],"set":[134],"key":[136],"technical":[137],"contributions":[138],"incorporation":[141],"receding":[143],"horizon":[144],"control,":[145],"visual":[146],"conditioning,":[147],"time-series":[150],"transformer.":[152],"hope":[154],"work":[156],"will":[157],"help":[158],"motivate":[159],"generation":[162],"techniques":[166],"are":[168],"able":[169],"leverage":[171],"generative":[174],"modeling":[175],"capabilities":[176],"models.":[179],"Code,":[180],"data,":[181],"details":[184],"is":[185],"publicly":[186],"available":[187],"diffusion-policy.cs.columbia.edu":[188]},"counts_by_year":[{"year":2025,"cited_by_count":11},{"year":2023,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
