{"id":"https://openalex.org/W7139130003","doi":"https://doi.org/10.48550/arxiv.2603.16861","title":"MolmoB0T: Large-Scale Simulation Enables Zero-Shot Manipulation","display_name":"MolmoB0T: Large-Scale Simulation Enables Zero-Shot Manipulation","publication_year":2026,"publication_date":"2026-03-17","ids":{"openalex":"https://openalex.org/W7139130003","doi":"https://doi.org/10.48550/arxiv.2603.16861"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.16861","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16861","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.16861","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130113487","display_name":"Abhay Deshpande","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Deshpande, Abhay","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125938065","display_name":"Maya Guru","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guru, Maya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129793549","display_name":"Rose Hendrix","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hendrix, Rose","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129930396","display_name":"Snehal Jauhri","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jauhri, Snehal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004894291","display_name":"Ainaz Eftekhar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Eftekhar, Ainaz","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108711709","display_name":"Rohun Tripathi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tripathi, Rohun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023640000","display_name":"Max Argus","orcid":"https://orcid.org/0000-0002-1288-7476"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Argus, Max","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125931455","display_name":"Jordi Salvador","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Salvador, Jordi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085879597","display_name":"Haoquan Fang","orcid":"https://orcid.org/0009-0007-9759-3867"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Haoquan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035949823","display_name":"Matthew Wallingford","orcid":"https://orcid.org/0000-0002-6797-9802"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wallingford, Matthew","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093931955","display_name":"Wilbert Pumacay","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pumacay, Wilbert","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129839630","display_name":"Yejin Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Yejin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5098954582","display_name":"Quinn Pfeifer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pfeifer, Quinn","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125941368","display_name":"Ying-Chun Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Ying-Chun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129920921","display_name":"Piper Wolters","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wolters, Piper","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130209075","display_name":"Omar Rayyan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rayyan, Omar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129985824","display_name":"Mingtong Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Mingtong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027184297","display_name":"Jiafei Duan","orcid":"https://orcid.org/0000-0003-4551-2424"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Duan, Jiafei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130055657","display_name":"Karen Farley","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Farley, Karen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129823701","display_name":"Winson Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Winson","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129970081","display_name":"Eli Vanderbilt","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vanderbilt, Eli","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130146151","display_name":"Dieter Fox","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fox, Dieter","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129880362","display_name":"Ali Farhadi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Farhadi, Ali","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026055366","display_name":"Georgia Chalvatzaki","orcid":"https://orcid.org/0000-0002-5055-199X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chalvatzaki, Georgia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129905048","display_name":"Dhruv Shah","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shah, Dhruv","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129780984","display_name":"Ranjay Krishna","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Krishna, Ranjay","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":26,"corresponding_author_ids":["https://openalex.org/A5130113487"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.38659998774528503,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.38659998774528503,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.3027999997138977,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.10000000149011612,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.608299970626831},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.5292999744415283},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.4875999987125397},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.47540000081062317},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.4269999861717224},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4122999906539917},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.39100000262260437},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.38690000772476196}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.777400016784668},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.608299970626831},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.579200029373169},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.5292999744415283},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.4875999987125397},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.47540000081062317},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.4269999861717224},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4122999906539917},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4009999930858612},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.39100000262260437},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.38690000772476196},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.3625999987125397},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.3174000084400177},{"id":"https://openalex.org/C186967261","wikidata":"https://www.wikidata.org/wiki/Q5082128","display_name":"Mobile device","level":2,"score":0.31709998846054077},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2962999939918518},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.28360000252723694},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.27720001339912415},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.2709999978542328},{"id":"https://openalex.org/C2776175482","wikidata":"https://www.wikidata.org/wiki/Q1195816","display_name":"Transfer (computing)","level":2,"score":0.2587999999523163},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.25200000405311584},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.16861","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16861","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.16861","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16861","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"A":[0],"prevailing":[1],"view":[2],"in":[3,91,206],"robot":[4],"learning":[5],"is":[6,10,16,61],"that":[7,41,54,220,234],"simulation":[8],"alone":[9],"not":[11,62],"enough;":[12],"effective":[13,66],"sim-to-real":[14],"transfer":[15,56,190],"widely":[17],"believed":[18],"to":[19,30,57,134,149,191,237],"require":[20],"at":[21,215],"least":[22],"some":[23],"real-world":[24,184],"data":[25,82],"collection":[26],"or":[27],"task-specific":[28],"fine-tuning":[29],"bridge":[31],"the":[32,58,131,158,166,238],"gap":[33],"between":[34],"simulated":[35,48,89],"and":[36,46,70,87,109,138,147,165,179,194],"physical":[37],"environments.":[38,195],"We":[39,73,112,152],"challenge":[40],"assumption.":[42],"With":[43,93],"sufficiently":[44],"large-scale":[45],"diverse":[47,88,226],"synthetic":[49],"training":[50],"data,":[51],"we":[52,95],"show":[53],"zero-shot":[55,189],"real":[59,207,239],"world":[60,208],"only":[63],"possible,":[64],"but":[65],"for":[67,80,105,144,161,172],"both":[68],"static":[69],"mobile":[71,170,180],"manipulation.":[72],"introduce":[74],"MolmoBot-Engine,":[75],"a":[76,98,118,124,140,201],"fully":[77],"open-source":[78],"pipeline":[79],"procedural":[81,221],"generation":[83,223],"across":[84,210],"robots,":[85],"tasks,":[86],"environments":[90],"MolmoSpaces.":[92],"it,":[94],"release":[96],"MolmoBot-Data,":[97],"dataset":[99],"of":[100,204],"1.8":[101],"million":[102],"expert":[103],"trajectories":[104],"articulated":[106,227],"object":[107],"manipulation":[108,163,232],"pick-and-place":[110],"tasks.":[111],"train":[113],"three":[114],"policy":[115,142],"classes:":[116],"MolmoBot,":[117],"Molmo2-based":[119],"multi-frame":[120],"vision-language":[121],"model":[122],"with":[123,225],"flow-matching":[125],"action":[126],"head;":[127],"MolmoBot-Pi0,":[128],"which":[129],"replicates":[130],"$\u03c0_0$":[132],"architecture":[133],"enable":[135],"direct":[136],"comparison;":[137],"MolmoBot-SPOC,":[139],"lightweight":[141],"suitable":[143],"edge":[145],"deployment":[146],"amenable":[148],"RL":[150],"fine-tuning.":[151],"evaluate":[153],"on":[154],"two":[155],"robotic":[156],"platforms:":[157],"Franka":[159],"FR3":[160],"tabletop":[162,197],"tasks":[164],"Rainbow":[167],"Robotics":[168],"RB-Y1":[169],"manipulator":[171],"door":[173],"opening,":[174],"drawer":[175],"manipulation,":[176],"cabinet":[177],"interaction,":[178],"pick-and-place.":[181],"Without":[182],"any":[183],"fine-tuning,":[185],"our":[186],"policies":[187,233],"achieve":[188],"unseen":[192],"objects":[193],"On":[196],"pick-and-place,":[198],"MolmoBot":[199],"achieves":[200],"success":[202],"rate":[203],"79.2%":[205],"evaluations":[209],"4":[211],"settings,":[212],"outperforming":[213],"$\u03c0_{0.5}$":[214],"39.2%.":[216],"Our":[217],"results":[218],"demonstrate":[219],"environment":[222],"combined":[224],"assets":[228],"can":[229],"produce":[230],"robust":[231],"generalize":[235],"broadly":[236],"world.":[240],"Technical":[241],"website:":[242],"https://allenai.github.io/MolmoBot":[243]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-20T00:00:00"}
