{"id":"https://openalex.org/W7162545679","doi":"https://doi.org/10.48550/arxiv.2605.26637","title":"Enabling Extensible Embodied Capabilities with Tools","display_name":"Enabling Extensible Embodied Capabilities with Tools","publication_year":2026,"publication_date":"2026-05-26","ids":{"openalex":"https://openalex.org/W7162545679","doi":"https://doi.org/10.48550/arxiv.2605.26637"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.26637","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26637","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.26637","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137174876","display_name":"Xueyang Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Xueyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137094226","display_name":"Zijia Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zijia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137088938","display_name":"Qianjiang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Qianjiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137158581","display_name":"Yibo Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Yibo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137177905","display_name":"Guiyao Tie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tie, Guiyao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137172832","display_name":"Li Wan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wan, Li","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137137864","display_name":"Yidan Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yidan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137086963","display_name":"Pan Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Pan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137090539","display_name":"Lichao Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Lichao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137086856","display_name":"Yongchao Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yongchao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.1462000012397766,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.1462000012397766,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.14589999616146088,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11431","display_name":"Action Observation and Synchronization","score":0.12409999966621399,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/embodied-cognition","display_name":"Embodied cognition","score":0.8733000159263611},{"id":"https://openalex.org/keywords/cognitive-robotics","display_name":"Cognitive robotics","score":0.5636000037193298},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5444999933242798},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5098000168800354},{"id":"https://openalex.org/keywords/externalization","display_name":"Externalization","score":0.4916999936103821},{"id":"https://openalex.org/keywords/embodied-agent","display_name":"Embodied agent","score":0.4846999943256378},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.4339999854564667}],"concepts":[{"id":"https://openalex.org/C100609095","wikidata":"https://www.wikidata.org/wiki/Q1335050","display_name":"Embodied cognition","level":2,"score":0.8733000159263611},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7085000276565552},{"id":"https://openalex.org/C192327766","wikidata":"https://www.wikidata.org/wiki/Q1038799","display_name":"Cognitive robotics","level":3,"score":0.5636000037193298},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5444999933242798},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5098000168800354},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.49570000171661377},{"id":"https://openalex.org/C2779379281","wikidata":"https://www.wikidata.org/wiki/Q61895854","display_name":"Externalization","level":2,"score":0.4916999936103821},{"id":"https://openalex.org/C103683099","wikidata":"https://www.wikidata.org/wiki/Q5370102","display_name":"Embodied agent","level":3,"score":0.4846999943256378},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.4339999854564667},{"id":"https://openalex.org/C165464430","wikidata":"https://www.wikidata.org/wiki/Q1570441","display_name":"Parameterized complexity","level":2,"score":0.4178999960422516},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.36390000581741333},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.3628999888896942},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.3336000144481659},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3125},{"id":"https://openalex.org/C32833848","wikidata":"https://www.wikidata.org/wiki/Q4115054","display_name":"Extensibility","level":2,"score":0.2953000068664551},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.2849999964237213},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2849000096321106},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2849000096321106},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.27090001106262207},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.26269999146461487}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.26637","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26637","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.26637","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26637","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Most":[0],"existing":[1],"embodied":[2,68,103,134,185],"intelligence":[3],"methods":[4],"formulate":[5],"perception,":[6,81],"reasoning,":[7,83],"planning,":[8],"and":[9,22,30,73,75,84,105,119,125,141,155,171],"control":[10],"within":[11,32],"a":[12,33,38,64,147,177,189],"unified":[13],"parameterized":[14],"policy.":[15],"Yet":[16],"these":[17],"capabilities":[18,45],"are":[19,151,158],"inherently":[20],"hierarchical":[21],"heterogeneous,":[23],"making":[24],"them":[25],"difficult":[26],"to":[27,96,173],"reliably":[28],"learn":[29],"modularize":[31],"single":[34],"model.":[35],"We":[36],"propose":[37],"capability":[39,130],"externalization":[40,131],"approach":[41],"that":[42,129,167],"decouples":[43],"heterogeneous":[44],"into":[46],"independently":[47],"optimized":[48],"tools,":[49],"dynamically":[50],"invoked":[51],"at":[52],"inference":[53],"time.":[54],"To":[55],"this":[56],"end,":[57],"we":[58,93],"introduce":[59],"Embodied":[60],"Tool":[61],"Protocol":[62],"(ETP),":[63],"standardized":[65],"protocol":[66],"for":[67,153,160,192],"tool":[69,88,100,115,117,186],"registration,":[70],"discovery,":[71],"invocation,":[72],"execution,":[74,118],"curate":[76],"100+":[77],"validated":[78],"tools":[79,111,175],"spanning":[80],"cognition,":[82],"execution":[85],"as":[86,188],"the":[87],"base.":[89],"Building":[90],"on":[91,139,143],"this,":[92],"construct":[94],"EmbodiedToolBench":[95],"evaluate":[97],"both":[98],"whether":[99],"augmentation":[101],"improves":[102,133],"performance":[104,135],"how":[106,172],"well":[107],"current":[108],"models":[109],"use":[110],"across":[112,123,180],"tool-necessity":[113],"recognition,":[114],"selection,":[116],"tool-chain":[120],"composition.":[121],"Experiments":[122],"simulation":[124],"real-world":[126],"platforms":[127],"confirm":[128],"consistently":[132],"(avg.":[136],"gain":[137],"31%":[138],"EB-ALFRED":[140],"36%":[142],"EB-Navigation),":[144],"yet":[145],"reveal":[146],"clear":[148],"boundary:":[149],"gains":[150],"substantial":[152],"cognition":[154],"perception":[156],"but":[157],"limited":[159],"execution-type":[161],"capabilities.":[162],"Moreover,":[163],"our":[164],"analysis":[165],"reveals":[166],"knowing":[168],"when,":[169],"which,":[170],"invoke":[174],"remains":[176],"persistent":[178],"challenge":[179],"all":[181],"models,":[182],"thereby":[183],"highlighting":[184],"competence":[187],"critical":[190],"direction":[191],"future":[193],"research.":[194]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-28T00:00:00"}
