{"id":"https://openalex.org/W4401415110","doi":"https://doi.org/10.1109/icra57147.2024.10611220","title":"Dream2Real: Zero-Shot 3D Object Rearrangement with Vision-Language Models","display_name":"Dream2Real: Zero-Shot 3D Object Rearrangement with Vision-Language Models","publication_year":2024,"publication_date":"2024-05-13","ids":{"openalex":"https://openalex.org/W4401415110","doi":"https://doi.org/10.1109/icra57147.2024.10611220"},"language":"en","primary_location":{"id":"doi:10.1109/icra57147.2024.10611220","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra57147.2024.10611220","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058833302","display_name":"Ivan Kapelyukh","orcid":"https://orcid.org/0000-0001-5587-204X"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Ivan Kapelyukh","raw_affiliation_strings":["The Robot Learning Lab at Imperial College,London"],"affiliations":[{"raw_affiliation_string":"The Robot Learning Lab at Imperial College,London","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086831854","display_name":"Yifei Ren","orcid":"https://orcid.org/0000-0001-9306-1678"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yifei Ren","raw_affiliation_strings":["The Robot Learning Lab at Imperial College,London"],"affiliations":[{"raw_affiliation_string":"The Robot Learning Lab at Imperial College,London","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044506939","display_name":"Ignacio Alzugaray","orcid":"https://orcid.org/0000-0002-7121-0000"},"institutions":[{"id":"https://openalex.org/I4210089887","display_name":"Dyson (United Kingdom)","ror":"https://ror.org/00a4npp83","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210089887"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Ignacio Alzugaray","raw_affiliation_strings":["The Dyson Robotics Lab"],"affiliations":[{"raw_affiliation_string":"The Dyson Robotics Lab","institution_ids":["https://openalex.org/I4210089887"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5080385974","display_name":"Edward Johns","orcid":"https://orcid.org/0000-0002-8914-8786"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Edward Johns","raw_affiliation_strings":["The Robot Learning Lab at Imperial College,London"],"affiliations":[{"raw_affiliation_string":"The Robot Learning Lab at Imperial College,London","institution_ids":["https://openalex.org/I47508984"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5058833302"],"corresponding_institution_ids":["https://openalex.org/I47508984"],"apc_list":null,"apc_paid":null,"fwci":3.9182,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.94775897,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"4796","last_page":"4803"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9905999898910522,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9855999946594238,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/zero","display_name":"Zero (linguistics)","score":0.636595606803894},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5617689490318298},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5486810207366943},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.518587589263916},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4831683039665222},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.4336540102958679},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.18016791343688965},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.130226731300354},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.07589998841285706}],"concepts":[{"id":"https://openalex.org/C2780813799","wikidata":"https://www.wikidata.org/wiki/Q3274237","display_name":"Zero (linguistics)","level":2,"score":0.636595606803894},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5617689490318298},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5486810207366943},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.518587589263916},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4831683039665222},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.4336540102958679},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.18016791343688965},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.130226731300354},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.07589998841285706},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra57147.2024.10611220","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra57147.2024.10611220","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7999120326","display_name":null,"funder_award_id":"EP/S036636/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":70,"referenced_works":["https://openalex.org/W398859631","https://openalex.org/W1515145374","https://openalex.org/W2009422376","https://openalex.org/W2016435525","https://openalex.org/W2141664020","https://openalex.org/W2786036844","https://openalex.org/W2914944935","https://openalex.org/W3097484130","https://openalex.org/W3176368002","https://openalex.org/W3206916018","https://openalex.org/W4200150166","https://openalex.org/W4221151978","https://openalex.org/W4224912544","https://openalex.org/W4226088469","https://openalex.org/W4226344024","https://openalex.org/W4311428907","https://openalex.org/W4312396403","https://openalex.org/W4312407972","https://openalex.org/W4312594400","https://openalex.org/W4312807436","https://openalex.org/W4312971576","https://openalex.org/W4318718936","https://openalex.org/W4367721889","https://openalex.org/W4379260839","https://openalex.org/W4380993732","https://openalex.org/W4383066118","https://openalex.org/W4383109488","https://openalex.org/W4383994326","https://openalex.org/W4385403813","https://openalex.org/W4385403849","https://openalex.org/W4385430538","https://openalex.org/W4385430588","https://openalex.org/W4385430678","https://openalex.org/W4385431115","https://openalex.org/W4385473486","https://openalex.org/W4385965471","https://openalex.org/W4386075953","https://openalex.org/W4386076018","https://openalex.org/W4386874741","https://openalex.org/W4388720459","https://openalex.org/W4389665359","https://openalex.org/W4389667789","https://openalex.org/W4390873331","https://openalex.org/W4390874575","https://openalex.org/W4401246959","https://openalex.org/W4401415428","https://openalex.org/W6747827861","https://openalex.org/W6784840303","https://openalex.org/W6785308759","https://openalex.org/W6791353385","https://openalex.org/W6800497432","https://openalex.org/W6801810553","https://openalex.org/W6803928713","https://openalex.org/W6809898026","https://openalex.org/W6810327023","https://openalex.org/W6810640255","https://openalex.org/W6839095836","https://openalex.org/W6841082114","https://openalex.org/W6845354634","https://openalex.org/W6846020498","https://openalex.org/W6847274768","https://openalex.org/W6847590248","https://openalex.org/W6849177959","https://openalex.org/W6853053110","https://openalex.org/W6853664340","https://openalex.org/W6853982971","https://openalex.org/W6854738657","https://openalex.org/W6854929498","https://openalex.org/W6855158220","https://openalex.org/W6858297711"],"related_works":["https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2772917594","https://openalex.org/W2775347418","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"We":[0],"introduce":[1],"Dream2Real,":[2],"a":[3,16,29,54,88,96],"robotics":[4],"framework":[5,104],"which":[6,60],"integrates":[7],"vision-language":[8],"models":[9],"(VLMs)":[10],"trained":[11],"on":[12,95,131],"2D":[13],"data":[14],"into":[15],"3D":[17,30],"object":[18],"rearrangement":[19,79,126],"pipeline.":[20],"This":[21,76],"is":[22,66,105],"achieved":[23],"by":[24,53,110],"the":[25,33,45,58,63,71],"robot":[26],"autonomously":[27],"constructing":[28],"representation":[31],"of":[32,44,91,98,113],"scene,":[34],"where":[35],"objects":[36],"can":[37],"be":[38,81],"rearranged":[39],"virtually":[40],"and":[41,68,118,124],"an":[42],"image":[43],"resulting":[46],"arrangement":[47,59],"rendered.":[48],"These":[49],"renders":[50],"are":[51,129],"evaluated":[52],"VLM,":[55],"so":[56],"that":[57,102],"best":[61],"satisfies":[62],"user":[64],"instruction":[65],"selected":[67],"recreated":[69],"in":[70],"real":[72],"world":[73],"with":[74],"pick-and-place.":[75],"enables":[77],"language-conditioned":[78],"to":[80,86,107,121],"performed":[82],"zero-shot,":[83],"without":[84],"needing":[85],"collect":[87],"training":[89],"dataset":[90],"example":[92],"arrangements.":[93],"Results":[94],"series":[97],"real-world":[99],"tasks":[100],"show":[101],"this":[103],"robust":[106],"distractors,":[108],"controllable":[109],"language,":[111],"capable":[112],"understanding":[114],"complex":[115],"multi-object":[116],"relations,":[117],"readily":[119],"applicable":[120],"both":[122],"tabletop":[123],"6-DoF":[125],"tasks.":[127],"Videos":[128],"available":[130],"our":[132],"webpage":[133],"at:":[134],"https://www.robot-learning.uk/dream2real.":[135]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":1}],"updated_date":"2026-03-01T08:55:55.761014","created_date":"2025-10-10T00:00:00"}
