{"id":"https://openalex.org/W7138072040","doi":"https://doi.org/10.1609/aaai.v40i5.37393","title":"Sparse3DPR: Training-Free 3D Hierarchical Scene Parsing and Task-Adaptive Subgraph Reasoning from Sparse RGB Views","display_name":"Sparse3DPR: Training-Free 3D Hierarchical Scene Parsing and Task-Adaptive Subgraph Reasoning from Sparse RGB Views","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138072040","doi":"https://doi.org/10.1609/aaai.v40i5.37393"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i5.37393","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i5.37393","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1609/aaai.v40i5.37393","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030208674","display_name":"Haida Feng","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Haida Feng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129642281","display_name":"Hao Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hao Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101845301","display_name":"Zewen Xu","orcid":"https://orcid.org/0009-0002-9700-3728"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zewen Xu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129731358","display_name":"Haolin Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haolin Wang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034695019","display_name":"Chade Li","orcid":"https://orcid.org/0009-0002-5558-4739"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chade Li","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129697205","display_name":"Yihong Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yihong Wu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5030208674"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.37136465,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"5","first_page":"3912","last_page":"3920"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8468000292778015,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8468000292778015,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.04529999941587448,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.025200000032782555,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.6565999984741211},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.6168000102043152},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.609499990940094},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5152000188827515},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.49799999594688416},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.46070000529289246},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.4374000132083893}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7714999914169312},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.6565999984741211},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6559000015258789},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.6168000102043152},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.609499990940094},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5152000188827515},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.49799999594688416},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.46070000529289246},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.4374000132083893},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4187999963760376},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4059000015258789},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3898000121116638},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35339999198913574},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.33009999990463257},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.3034999966621399},{"id":"https://openalex.org/C2781020372","wikidata":"https://www.wikidata.org/wiki/Q533093","display_name":"On the fly","level":2,"score":0.2928999960422516},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.2888000011444092},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.28700000047683716},{"id":"https://openalex.org/C155911833","wikidata":"https://www.wikidata.org/wiki/Q3817354","display_name":"Spatial intelligence","level":2,"score":0.27140000462532043},{"id":"https://openalex.org/C131992880","wikidata":"https://www.wikidata.org/wiki/Q2528185","display_name":"Subgraph isomorphism problem","level":3,"score":0.257099986076355}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i5.37393","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i5.37393","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i5.37393","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i5.37393","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.6499202847480774}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recently,":[0],"large":[1],"language":[2],"models":[3],"(LLMs)":[4],"have":[5],"been":[6],"explored":[7],"widely":[8],"for":[9,20,50],"3D":[10,116],"scene":[11,52,74,117],"understanding.":[12],"Among":[13],"them,":[14],"training-free":[15,48],"approaches":[16],"are":[17],"gaining":[18],"attention":[19],"their":[21],"flexibility":[22],"and":[23,34,62,80,93,114,120,135,162],"generalization":[24,163],"over":[25],"training-based":[26,151],"methods.":[27],"However,":[28],"they":[29],"typically":[30],"struggle":[31],"with":[32,140,155],"accuracy":[33],"efficiency":[35,119],"in":[36],"practical":[37],"deployment.":[38],"To":[39],"address":[40],"the":[41,56,125,143],"problems,":[42],"we":[43,69,99],"propose":[44],"Sparse3DPR,":[45,128],"a":[46,71,101,131,136],"novel":[47],"framework":[49],"open-ended":[51],"understanding,":[53],"which":[54,88,129],"leverages":[55],"reasoning":[57,91,118],"capabilities":[58],"of":[59,127],"pre-trained":[60],"LLMs":[61],"requires":[63],"only":[64],"sparse-view":[65],"RGB":[66],"inputs.":[67],"Specifically,":[68],"introduce":[70],"hierarchical":[72],"plane-enhanced":[73],"graph":[75],"that":[76],"supports":[77],"open":[78],"vocabulary":[79],"adopts":[81],"dominant":[82],"planar":[83],"structures":[84],"as":[85],"spatial":[86],"anchors,":[87],"enables":[89],"clearer":[90],"chains":[92],"more":[94],"reliable":[95],"high-level":[96],"inferences.":[97],"Furthermore,":[98],"design":[100],"task-adaptive":[102],"subgraph":[103],"extraction":[104],"method":[105],"to":[106,150],"filter":[107],"query-irrelevant":[108],"information":[109],"dynamically,":[110],"reducing":[111],"contextual":[112],"noise":[113],"improving":[115],"accuracy.":[121],"Experimental":[122],"results":[123],"demonstrate":[124],"superiority":[126],"achieves":[130],"28.7%":[132],"EM@1":[133],"improvement":[134],"78.2%":[137],"speedup":[138],"compared":[139],"ConceptGraphs":[141],"on":[142,153],"Space3D-Bench.":[144],"Moreover,":[145],"Sparse3DPR":[146],"obtains":[147],"comparable":[148],"performance":[149],"methods":[152],"ScanQA,":[154],"additional":[156],"real-world":[157],"experiments":[158],"confirming":[159],"its":[160],"robustness":[161],"capability.":[164]},"counts_by_year":[],"updated_date":"2026-03-18T06:31:55.123368","created_date":"2026-03-18T00:00:00"}
