{"id":"https://openalex.org/W7148921804","doi":"https://doi.org/10.48550/arxiv.2604.01882","title":"A3R: Agentic Affordance Reasoning via Cross-Dimensional Evidence in 3D Gaussian Scenes","display_name":"A3R: Agentic Affordance Reasoning via Cross-Dimensional Evidence in 3D Gaussian Scenes","publication_year":2026,"publication_date":"2026-04-02","ids":{"openalex":"https://openalex.org/W7148921804","doi":"https://doi.org/10.48550/arxiv.2604.01882"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.01882","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01882","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.01882","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132861450","display_name":"Di Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Di","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132861419","display_name":"Jie Feng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feng, Jie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132867712","display_name":"Guanbin Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Guanbin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132888566","display_name":"Ronghua Shang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shang, Ronghua","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132854330","display_name":"Yuhui Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Yuhui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132853458","display_name":"Weisheng Dong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dong, Weisheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132901178","display_name":"Guangming Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Guangming","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5132861450"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.4056999981403351,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.4056999981403351,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.2728999853134155,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.050599999725818634,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/affordance","display_name":"Affordance","score":0.949400007724762},{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.70169997215271},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.6046000123023987},{"id":"https://openalex.org/keywords/visual-reasoning","display_name":"Visual reasoning","score":0.36970001459121704},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.35659998655319214},{"id":"https://openalex.org/keywords/empirical-evidence","display_name":"Empirical evidence","score":0.34459999203681946},{"id":"https://openalex.org/keywords/gaussian-process","display_name":"Gaussian process","score":0.3041999936103821}],"concepts":[{"id":"https://openalex.org/C194995250","wikidata":"https://www.wikidata.org/wiki/Q531136","display_name":"Affordance","level":2,"score":0.949400007724762},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.70169997215271},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6718999743461609},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.6046000123023987},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5950000286102295},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4092000126838684},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.36970001459121704},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.35659998655319214},{"id":"https://openalex.org/C166052673","wikidata":"https://www.wikidata.org/wiki/Q83021","display_name":"Empirical evidence","level":2,"score":0.34459999203681946},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.33809998631477356},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.3041999936103821},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2939000129699707},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.28450000286102295},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.2777999937534332},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.2768999934196472},{"id":"https://openalex.org/C132758656","wikidata":"https://www.wikidata.org/wiki/Q5307365","display_name":"Dreyfus model of skill acquisition","level":2,"score":0.275299996137619},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.2750000059604645},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.27309998869895935},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2551000118255615}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.01882","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01882","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.01882","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01882","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7129719853401184,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Affordance":[0],"reasoning":[1,75,105,147,173],"in":[2,21,46,174],"3D":[3,48,89,176],"Gaussian":[4,177],"scenes":[5],"aims":[6],"to":[7,112],"identify":[8],"the":[9,13,120,163],"region":[10],"that":[11,107,141,155],"supports":[12],"action":[14],"specified":[15],"by":[16],"a":[17,77,136],"given":[18],"text":[19],"instruction":[20],"complex":[22,47,175],"environments.":[23],"Existing":[24],"methods":[25],"typically":[26],"cast":[27],"this":[28,69,97],"problem":[29],"as":[30,76],"one-shot":[31,160],"prediction":[32,57],"from":[33,55,60],"static":[34,159],"scene":[35],"observations,":[36],"assuming":[37],"sufficient":[38],"evidence":[39,63,79,115,125,143,168],"is":[40,84],"already":[41],"available":[42],"for":[43,170],"reasoning.":[44],"However,":[45],"scenes,":[49],"many":[50],"failure":[51],"cases":[52],"arise":[53],"not":[54],"weak":[56],"capacity,":[58],"but":[59],"incomplete":[61],"task-relevant":[62],"under":[64],"fixed":[65],"observations.":[66],"To":[67,127],"address":[68],"limitation,":[70],"we":[71,99,133],"reformulate":[72],"fine-grained":[73,171],"affordance":[74,104,121,172],"sequential":[78,130],"acquisition":[80,116,144,169],"process,":[81],"where":[82],"ambiguity":[83],"progressively":[85],"reduced":[86],"through":[87,123],"complementary":[88],"geometric":[90],"and":[91,118,146],"2D":[92],"semantic":[93],"evidence.":[94],"Building":[95],"on":[96,151],"formulation,":[98],"propose":[100],"A3R,":[101],"an":[102,109],"agentic":[103,166],"framework":[106],"enables":[108],"MLLM-based":[110],"policy":[111,138],"iteratively":[113],"select":[114],"actions":[117],"update":[119],"belief":[122],"cross-dimensional":[124,167],"acquisition.":[126],"optimize":[128],"such":[129],"decision":[131],"making,":[132],"further":[134],"introduce":[135],"GRPO-based":[137],"learning":[139],"strategy":[140],"improves":[142],"efficiency":[145],"accuracy.":[148],"Extensive":[149],"experiments":[150],"scene-level":[152],"benchmarks":[153],"show":[154],"A3R":[156],"consistently":[157],"surpasses":[158],"baselines,":[161],"demonstrating":[162],"advantage":[164],"of":[165],"scenes.":[178]},"counts_by_year":[],"updated_date":"2026-04-04T06:15:33.020886","created_date":"2026-04-04T00:00:00"}
