{"id":"https://openalex.org/W4413944786","doi":"https://doi.org/10.1109/icra55743.2025.11127873","title":"Embodiment-agnostic Action Planning via Object-Part Scene Flow","display_name":"Embodiment-agnostic Action Planning via Object-Part Scene Flow","publication_year":2025,"publication_date":"2025-05-19","ids":{"openalex":"https://openalex.org/W4413944786","doi":"https://doi.org/10.1109/icra55743.2025.11127873"},"language":"en","primary_location":{"id":"doi:10.1109/icra55743.2025.11127873","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11127873","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034309002","display_name":"Weiliang Tang","orcid":"https://orcid.org/0009-0007-5794-858X"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weiliang Tang","raw_affiliation_strings":["Chinese University of Hong Kong,Department of Computer Science and Engineering"],"affiliations":[{"raw_affiliation_string":"Chinese University of Hong Kong,Department of Computer Science and Engineering","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023225646","display_name":"Jiahui Pan","orcid":"https://orcid.org/0000-0002-7576-6743"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jia-Hui Pan","raw_affiliation_strings":["Chinese University of Hong Kong,Department of Computer Science and Engineering"],"affiliations":[{"raw_affiliation_string":"Chinese University of Hong Kong,Department of Computer Science and Engineering","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021239979","display_name":"Wei Zhan","orcid":"https://orcid.org/0000-0002-7167-6353"},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wei Zhan","raw_affiliation_strings":["UC Berkeley,The Department of Mechanical Engineering"],"affiliations":[{"raw_affiliation_string":"UC Berkeley,The Department of Mechanical Engineering","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005976047","display_name":"Jianshu Zhou","orcid":"https://orcid.org/0000-0003-3900-3519"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]},{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jianshu Zhou","raw_affiliation_strings":["UC Berkeley,The Department of Mechanical Engineering"],"affiliations":[{"raw_affiliation_string":"UC Berkeley,The Department of Mechanical Engineering","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051534896","display_name":"Huaxiu Yao","orcid":"https://orcid.org/0000-0002-8691-9629"},"institutions":[{"id":"https://openalex.org/I1333535994","display_name":"University of North Carolina Health Care","ror":"https://ror.org/00qz24g20","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1333535994"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Huaxiu Yao","raw_affiliation_strings":["UNC-Chapel Hill,The Department of Computer Science"],"affiliations":[{"raw_affiliation_string":"UNC-Chapel Hill,The Department of Computer Science","institution_ids":["https://openalex.org/I1333535994"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100707660","display_name":"Yunhui Liu","orcid":"https://orcid.org/0000-0002-3625-6679"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yun-Hui Liu","raw_affiliation_strings":["The Chinese University of Hong Kong,The Department of Mechanical and Automation Engineering"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong,The Department of Mechanical and Automation Engineering","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064077634","display_name":"Masayoshi Tomizuka","orcid":"https://orcid.org/0000-0003-0206-6639"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]},{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Masayoshi Tomizuka","raw_affiliation_strings":["UC Berkeley,The Department of Mechanical Engineering"],"affiliations":[{"raw_affiliation_string":"UC Berkeley,The Department of Mechanical Engineering","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022382771","display_name":"Mingyu Ding","orcid":"https://orcid.org/0000-0001-6556-8359"},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mingyu Ding","raw_affiliation_strings":["UC Berkeley,The Department of Mechanical Engineering"],"affiliations":[{"raw_affiliation_string":"UC Berkeley,The Department of Mechanical Engineering","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054382056","display_name":"Chi\u2010Wing Fu","orcid":"https://orcid.org/0000-0002-5238-593X"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chi-Wing Fu","raw_affiliation_strings":["Chinese University of Hong Kong,Department of Computer Science and Engineering"],"affiliations":[{"raw_affiliation_string":"Chinese University of Hong Kong,Department of Computer Science and Engineering","institution_ids":["https://openalex.org/I177725633"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5034309002"],"corresponding_institution_ids":["https://openalex.org/I177725633"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.35448965,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2086","last_page":"2093"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9901999831199646,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9696000218391418,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.734789252281189},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.6404030919075012},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.615889310836792},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4898507297039032},{"id":"https://openalex.org/keywords/flow","display_name":"Flow (mathematics)","score":0.4844651222229004},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.47980430722236633},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.40299472212791443},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.06613439321517944}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.734789252281189},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.6404030919075012},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.615889310836792},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4898507297039032},{"id":"https://openalex.org/C38349280","wikidata":"https://www.wikidata.org/wiki/Q1434290","display_name":"Flow (mathematics)","level":2,"score":0.4844651222229004},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.47980430722236633},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.40299472212791443},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.06613439321517944},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra55743.2025.11127873","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11127873","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W1901129140","https://openalex.org/W2194775991","https://openalex.org/W2443711627","https://openalex.org/W2528489519","https://openalex.org/W2625731136","https://openalex.org/W2769112066","https://openalex.org/W2962737955","https://openalex.org/W2963802910","https://openalex.org/W2964191259","https://openalex.org/W3004396697","https://openalex.org/W3038298277","https://openalex.org/W3122520957","https://openalex.org/W3132708124","https://openalex.org/W3134939669","https://openalex.org/W3204657926","https://openalex.org/W4312631723","https://openalex.org/W4312769771","https://openalex.org/W4312903454","https://openalex.org/W4385403811","https://openalex.org/W4385430451","https://openalex.org/W4385430685","https://openalex.org/W4386065350","https://openalex.org/W4402354112","https://openalex.org/W4402754134","https://openalex.org/W4403888324","https://openalex.org/W4403906568","https://openalex.org/W4405785673"],"related_works":["https://openalex.org/W2737719445","https://openalex.org/W2898210368","https://openalex.org/W4239098401","https://openalex.org/W2382480268","https://openalex.org/W1976518449","https://openalex.org/W2732837990","https://openalex.org/W2755342338","https://openalex.org/W2363366881","https://openalex.org/W2779427294","https://openalex.org/W2604548540"],"abstract_inverted_index":{"Observing":[0],"that":[1,51,171],"the":[2,11,21,28,39,54,69,105,108,133,157],"key":[3],"for":[4,42,107,135],"robotic":[5],"action":[6,40,56],"planning":[7],"is":[8,18,50,81],"to":[9,26,37,90,103,111,117,126,182],"understand":[10],"target-object":[12],"motion":[13,60],"when":[14],"its":[15,35],"associated":[16],"part":[17,106],"manipulated":[19],"by":[20,67,152],"end":[22,109],"effector,":[23],"we":[24,166],"propose":[25],"generate":[27],"3D":[29],"object-part":[30,101],"scene":[31],"flow":[32],"and":[33,87,122,131,154,162],"extract":[34,127],"transformations":[36],"solve":[38,132],"trajectories":[41],"diverse":[43,85,136],"embodiments.":[44,137,184],"The":[45],"advantage":[46],"of":[47],"our":[48,79,145,172],"approach":[49],"it":[52],"derives":[53],"robot":[55],"explicitly":[57],"from":[58,92],"object":[59,70],"prediction,":[61],"yielding":[62],"a":[63,123],"more":[64],"robust":[65],"policy":[66],"understanding":[68],"motions.":[71],"Also,":[72],"beyond":[73],"policies":[74],"trained":[75,174],"on":[76,139,156],"embodiment-centric":[77],"data,":[78,144],"method":[80,96,146],"embodiment-agnostic,":[82],"generalizable":[83],"across":[84],"embodiments,":[86],"being":[88],"able":[89],"learn":[91],"human":[93,177],"demonstrations.":[94],"Our":[95],"comprises":[97],"three":[98],"components:":[99],"an":[100,113],"predictor":[102],"locate":[104],"effector":[110],"manipulate,":[112],"RGBD":[114,120],"video":[115],"generator":[116],"predict":[118],"future":[119],"videos,":[121],"trajectory":[124,134,143],"planner":[125],"embodiment-agnostic":[128],"transformation":[129],"sequences":[130],"Trained":[138],"videos":[140],"even":[141],"without":[142],"still":[147],"outperforms":[148],"existing":[149],"works":[150],"significantly":[151],"27.7%":[153],"26.2%":[155],"prevailing":[158],"virtual":[159],"environments":[160],"MetaWorld":[161],"Franka-Kitchen,":[163],"respectively.":[164],"Furthermore,":[165],"conducted":[167],"real-world":[168],"experiments,":[169],"showing":[170],"policy,":[173],"only":[175],"with":[176],"demonstration,":[178],"can":[179],"be":[180],"deployed":[181],"various":[183]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
