{"id":"https://openalex.org/W7134839736","doi":"https://doi.org/10.48550/arxiv.2603.08111","title":"DeReCo: Decoupling Representation and Coordination Learning for Object-Adaptive Decentralized Multi-Robot Cooperative Transport","display_name":"DeReCo: Decoupling Representation and Coordination Learning for Object-Adaptive Decentralized Multi-Robot Cooperative Transport","publication_year":2026,"publication_date":"2026-03-09","ids":{"openalex":"https://openalex.org/W7134839736","doi":"https://doi.org/10.48550/arxiv.2603.08111"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.08111","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073719311","display_name":"Kazuki Shibata","orcid":"https://orcid.org/0000-0003-0753-7663"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shibata, Kazuki","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114761611","display_name":"Ryosuke Sota","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sota, Ryosuke","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128655192","display_name":"Shandil Dhiresh Bosch","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bosch, Shandil Dhiresh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001325713","display_name":"Yuki Kadokawa","orcid":"https://orcid.org/0000-0003-3358-9520"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kadokawa, Yuki","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128654235","display_name":"Tsurumine Yoshihisa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yoshihisa, Tsurumine","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128682240","display_name":"Takamitsu Matsubara","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Matsubara, Takamitsu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.5365999937057495,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.5365999937057495,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.21459999680519104,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.03440000116825104,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/observability","display_name":"Observability","score":0.8393999934196472},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.708299994468689},{"id":"https://openalex.org/keywords/decoupling","display_name":"Decoupling (probability)","score":0.6617000102996826},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.510200023651123},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.4959999918937683},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.47200000286102295},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.4528999924659729}],"concepts":[{"id":"https://openalex.org/C36299963","wikidata":"https://www.wikidata.org/wiki/Q1369844","display_name":"Observability","level":2,"score":0.8393999934196472},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.708299994468689},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6629999876022339},{"id":"https://openalex.org/C205606062","wikidata":"https://www.wikidata.org/wiki/Q5249645","display_name":"Decoupling (probability)","level":2,"score":0.6617000102996826},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.510200023651123},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.4959999918937683},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.47200000286102295},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4659000039100647},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.4528999924659729},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.39320001006126404},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.32760000228881836},{"id":"https://openalex.org/C2780695315","wikidata":"https://www.wikidata.org/wiki/Q3799040","display_name":"Unobservable","level":2,"score":0.3262999951839447},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.32499998807907104},{"id":"https://openalex.org/C107257861","wikidata":"https://www.wikidata.org/wiki/Q656316","display_name":"Coordination game","level":2,"score":0.3131999969482422},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.2743000090122223},{"id":"https://openalex.org/C2779110517","wikidata":"https://www.wikidata.org/wiki/Q1240788","display_name":"Supervisor","level":2,"score":0.25600001215934753}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.08111","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.08111","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08111","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.08111","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Generalizing":[0],"decentralized":[1,18,159],"multi-robot":[2,116],"cooperative":[3,117],"transport":[4,127],"across":[5,124],"objects":[6,125,193,207],"with":[7,139,194],"diverse":[8],"shapes":[9,57],"and":[10,30,47,58,70,111,122,126,151,167,170,173,197,200],"physical":[11,59],"properties":[12,60],"remains":[13],"a":[14,104,131],"fundamental":[15],"challenge.":[16],"Under":[17],"execution,":[19],"two":[20,205],"key":[21],"challenges":[22],"arise:":[23],"object-dependent":[24,45,146],"representation":[25,69,90,110,166],"learning":[26,32,36,113,138,169],"under":[27,38,78],"partial":[28,79],"observability":[29,80],"coordination":[31,71,82,112,137,168],"in":[33,50,86,93,183,208],"multi-agent":[34],"reinforcement":[35],"(MARL)":[37],"non-stationarity.":[39],"A":[40],"typical":[41],"approach":[42],"jointly":[43],"optimizes":[44],"representations":[46,77,147],"coordinated":[48],"policies":[49],"an":[51],"end-to-end":[52],"manner":[53],"while":[54,84],"randomizing":[55],"object":[56,141],"during":[61],"training.":[62,95,175],"However,":[63],"this":[64,98],"joint":[65],"optimization":[66],"tightly":[67],"couples":[68],"learning,":[72,83,91],"introducing":[73],"bidirectional":[74],"interference:":[75],"inaccurate":[76],"destabilize":[81],"non-stationarity":[85],"MARL":[87,106],"further":[88],"degrades":[89],"resulting":[92],"sample-inefficient":[94],"To":[96],"address":[97],"structural":[99],"coupling,":[100],"we":[101],"propose":[102],"DeReCo,":[103],"novel":[105],"framework":[107],"that":[108,179],"decouples":[109],"for":[114,158],"object-adaptive":[115],"transport,":[118],"improving":[119],"sample":[120],"efficiency":[121],"generalization":[123],"scenarios.":[128],"DeReCo":[129,180],"adopts":[130],"three-stage":[132],"training":[133,187],"strategy:":[134],"(1)":[135],"centralized":[136],"privileged":[140,156],"information,":[142],"(2)":[143],"reconstruction":[144],"of":[145,155],"from":[148],"local":[149],"observations,":[150],"(3)":[152],"progressive":[153],"removal":[154],"information":[157],"execution.":[160],"This":[161],"decoupling":[162],"mitigates":[163],"interference":[164],"between":[165],"enables":[171],"stable":[172],"sample-efficient":[174],"Experimental":[176],"results":[177],"show":[178],"outperforms":[181],"baselines":[182],"simulation":[184],"on":[185,204],"three":[186],"objects,":[188],"generalizes":[189],"to":[190],"six":[191],"unseen":[192,206],"varying":[195],"masses":[196],"friction":[198],"coefficients,":[199],"achieves":[201],"superior":[202],"performance":[203],"real-robot":[209],"experiments.":[210]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-11T00:00:00"}
