{"id":"https://openalex.org/W7130584412","doi":"https://doi.org/10.48550/arxiv.2602.16356","title":"Articulated 3D Scene Graphs for Open-World Mobile Manipulation","display_name":"Articulated 3D Scene Graphs for Open-World Mobile Manipulation","publication_year":2026,"publication_date":"2026-02-18","ids":{"openalex":"https://openalex.org/W7130584412","doi":"https://doi.org/10.48550/arxiv.2602.16356"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.16356","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002929602","display_name":"Martin B\u00fcchner","orcid":"https://orcid.org/0000-0001-8725-1213"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"B\u00fcchner, Martin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007336076","display_name":"Adrian R\u00f6fer","orcid":"https://orcid.org/0000-0001-6132-0989"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"R\u00f6fer, Adrian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114400007","display_name":"Tim Engelbracht","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Engelbracht, Tim","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084779517","display_name":"Tim Welschehold","orcid":"https://orcid.org/0000-0003-1163-4992"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Welschehold, Tim","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062464940","display_name":"Zuria Bauer","orcid":"https://orcid.org/0000-0001-8447-2344"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bauer, Zuria","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122849832","display_name":"Hermann Blum","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Blum, Hermann","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126372334","display_name":"Marc Pollefeys","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pollefeys, Marc","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5114637789","display_name":"Abhinav Valada","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Valada, Abhinav","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5002929602"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.48420000076293945,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.48420000076293945,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1768999993801117,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.08020000159740448,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.6140000224113464},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.4648999869823456},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4620000123977661},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.44359999895095825},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.44200000166893005},{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.3865000009536743},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.3817000091075897},{"id":"https://openalex.org/keywords/revolute-joint","display_name":"Revolute joint","score":0.3553999960422516},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.3515999913215637}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7400000095367432},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6391000151634216},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.6140000224113464},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.588100016117096},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.4648999869823456},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4620000123977661},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.44359999895095825},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.44200000166893005},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.3865000009536743},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.3817000091075897},{"id":"https://openalex.org/C5643039","wikidata":"https://www.wikidata.org/wiki/Q3819341","display_name":"Revolute joint","level":3,"score":0.3553999960422516},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.3515999913215637},{"id":"https://openalex.org/C20894473","wikidata":"https://www.wikidata.org/wiki/Q1116105","display_name":"Object model","level":3,"score":0.3495999872684479},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.34950000047683716},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.34929999709129333},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3325999975204468},{"id":"https://openalex.org/C179372163","wikidata":"https://www.wikidata.org/wiki/Q1406181","display_name":"Scene graph","level":3,"score":0.33160001039505005},{"id":"https://openalex.org/C186967261","wikidata":"https://www.wikidata.org/wiki/Q5082128","display_name":"Mobile device","level":2,"score":0.32919999957084656},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.322299987077713},{"id":"https://openalex.org/C27511587","wikidata":"https://www.wikidata.org/wiki/Q2178623","display_name":"Spatial relation","level":2,"score":0.3109999895095825},{"id":"https://openalex.org/C2779337067","wikidata":"https://www.wikidata.org/wiki/Q4800961","display_name":"Articulation (sociology)","level":3,"score":0.30970001220703125},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.3073999881744385},{"id":"https://openalex.org/C58581272","wikidata":"https://www.wikidata.org/wiki/Q12741163","display_name":"Workspace","level":3,"score":0.3034999966621399},{"id":"https://openalex.org/C53073257","wikidata":"https://www.wikidata.org/wiki/Q7075021","display_name":"Object-oriented design","level":3,"score":0.2989000082015991},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.26750001311302185},{"id":"https://openalex.org/C190727649","wikidata":"https://www.wikidata.org/wiki/Q1941532","display_name":"Mobile manipulator","level":4,"score":0.2624000012874603},{"id":"https://openalex.org/C139002025","wikidata":"https://www.wikidata.org/wiki/Q3001212","display_name":"Lift (data mining)","level":2,"score":0.26159998774528503},{"id":"https://openalex.org/C2778775528","wikidata":"https://www.wikidata.org/wiki/Q5135432","display_name":"Closing (real estate)","level":2,"score":0.2540999948978424}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.16356","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.16356","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.16356","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.16356","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11","score":0.4296756684780121}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Semantics":[0],"has":[1],"enabled":[2],"3D":[3,50,88],"scene":[4,51,202],"understanding":[5],"and":[6,36,74,89,104,120,163,178,194,217],"affordance-driven":[7],"object":[8,67,72,76,144,151,161],"interaction.":[9],"However,":[10],"robots":[11],"operating":[12],"in":[13,108,210],"real-world":[14,188],"environments":[15],"face":[16],"a":[17,44,57,94,109,192,195],"critical":[18],"limitation:":[19],"they":[20],"cannot":[21],"anticipate":[22],"how":[23],"objects":[24,116,123,209],"move.":[25],"Long-horizon":[26],"mobile":[27,196],"manipulation":[28,206],"requires":[29],"closing":[30],"the":[31,136,171],"gap":[32],"between":[33],"semantics,":[34],"geometry,":[35],"kinematics.":[37],"In":[38,186],"this":[39],"work,":[40],"we":[41,69,114],"present":[42],"MoMa-SG,":[43],"novel":[45,95,137],"framework":[46],"for":[47],"building":[48],"semantic-kinematic":[49,201],"graphs":[52,203],"of":[53,59,173,183,207],"articulated":[54,208],"scenes":[55],"containing":[56,65,159],"myriad":[58],"interactable":[60],"objects.":[61],"Given":[62],"RGB-D":[63,157],"sequences":[64,158],"multiple":[66],"articulations,":[68],"temporally":[70],"segment":[71],"interactions":[73,162],"infer":[75],"motion":[77],"using":[78,93],"occlusion-robust":[79],"point":[80,85],"tracking.":[81],"We":[82,133,168,214],"then":[83],"lift":[84],"trajectories":[86],"into":[87],"estimate":[90],"articulation":[91],"models":[92],"unified":[96],"twist":[97],"estimation":[98],"formulation":[99],"that":[100,199],"robustly":[101],"estimates":[102],"revolute":[103],"prismatic":[105],"joint":[106],"parameters":[107],"single":[110],"optimization":[111],"pass.":[112],"Next,":[113],"associate":[115],"with":[117,150],"estimated":[118],"articulations":[119],"detect":[121],"contained":[122],"by":[124],"reasoning":[125],"over":[126],"parent-child":[127,147],"relations":[128],"at":[129],"identified":[130],"opening":[131],"states.":[132],"also":[134],"introduce":[135],"Arti4D-Semantic":[138],"dataset,":[139],"which":[140],"uniquely":[141],"combines":[142],"hierarchical":[143],"semantics":[145],"including":[146],"relation":[148],"labels":[149],"axis":[152],"annotations":[153],"across":[154],"62":[155],"in-the-wild":[156],"600":[160],"three":[164],"distinct":[165],"observation":[166],"paradigms.":[167],"extensively":[169],"evaluate":[170],"performance":[172],"MoMa-SG":[174],"on":[175,190],"two":[176],"datasets":[177],"ablate":[179],"key":[180],"design":[181],"choices":[182],"our":[184,200],"approach.":[185],"addition,":[187],"experiments":[189],"both":[191],"quadruped":[193],"manipulator":[197],"demonstrate":[198],"enable":[204],"robust":[205],"everyday":[211],"home":[212],"environments.":[213],"provide":[215],"code":[216],"data":[218],"at:":[219],"https://momasg.cs.uni-freiburg.de.":[220]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-20T00:00:00"}
