{"id":"https://openalex.org/W4401991036","doi":"https://doi.org/10.1109/icmew63481.2024.10645436","title":"Dual Attribute-Spatial Relation Alignment for 3D Visual Grounding","display_name":"Dual Attribute-Spatial Relation Alignment for 3D Visual Grounding","publication_year":2024,"publication_date":"2024-07-15","ids":{"openalex":"https://openalex.org/W4401991036","doi":"https://doi.org/10.1109/icmew63481.2024.10645436"},"language":"en","primary_location":{"id":"doi:10.1109/icmew63481.2024.10645436","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmew63481.2024.10645436","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo Workshops (ICMEW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045448155","display_name":"X. Yue","orcid":"https://orcid.org/0000-0001-6956-3205"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"X. Yue","raw_affiliation_strings":["School of Information Science and Technology, University of Science and Technology of China,Hefei,China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, University of Science and Technology of China,Hefei,China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071731372","display_name":"Kaizhi Yang","orcid":"https://orcid.org/0000-0001-6274-7060"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaizhi Yang","raw_affiliation_strings":["School of Information Science and Technology, University of Science and Technology of China,Hefei,China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, University of Science and Technology of China,Hefei,China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053096325","display_name":"Kai Cheng","orcid":"https://orcid.org/0000-0003-1243-7093"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Cheng","raw_affiliation_strings":["School of Data Science, University of Science and Technology of China,Hefei,China"],"affiliations":[{"raw_affiliation_string":"School of Data Science, University of Science and Technology of China,Hefei,China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055469774","display_name":"Jiebo Luo","orcid":"https://orcid.org/0000-0002-4516-9729"},"institutions":[{"id":"https://openalex.org/I5388228","display_name":"University of Rochester","ror":"https://ror.org/022kthw22","country_code":"US","type":"education","lineage":["https://openalex.org/I5388228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiebo Luo","raw_affiliation_strings":["University of Rochester,Department of Computer Science,New York,United States"],"affiliations":[{"raw_affiliation_string":"University of Rochester,Department of Computer Science,New York,United States","institution_ids":["https://openalex.org/I5388228"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088031350","display_name":"Xuejin Chen","orcid":"https://orcid.org/0000-0003-0478-7018"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuejin Chen","raw_affiliation_strings":["School of Information Science and Technology, University of Science and Technology of China,Hefei,China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, University of Science and Technology of China,Hefei,China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5045448155"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":0.5248,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.65259356,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7217094898223877},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.5963149070739746},{"id":"https://openalex.org/keywords/dual","display_name":"Dual (grammatical number)","score":0.5634293556213379},{"id":"https://openalex.org/keywords/spatial-relation","display_name":"Spatial relation","score":0.5360107421875},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5060636401176453},{"id":"https://openalex.org/keywords/ground","display_name":"Ground","score":0.43847405910491943},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.43593788146972656},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.19797861576080322},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09568315744400024}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7217094898223877},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.5963149070739746},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.5634293556213379},{"id":"https://openalex.org/C27511587","wikidata":"https://www.wikidata.org/wiki/Q2178623","display_name":"Spatial relation","level":2,"score":0.5360107421875},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5060636401176453},{"id":"https://openalex.org/C168993435","wikidata":"https://www.wikidata.org/wiki/Q6501125","display_name":"Ground","level":2,"score":0.43847405910491943},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.43593788146972656},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.19797861576080322},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09568315744400024},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icmew63481.2024.10645436","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmew63481.2024.10645436","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo Workshops (ICMEW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2251329024","https://openalex.org/W2594519801","https://openalex.org/W2896457183","https://openalex.org/W3095974555","https://openalex.org/W3107521863","https://openalex.org/W3133833192","https://openalex.org/W3140398265","https://openalex.org/W3166396011","https://openalex.org/W3175234951","https://openalex.org/W3178489527","https://openalex.org/W3203949114","https://openalex.org/W3206171352","https://openalex.org/W4214684415","https://openalex.org/W4281732104","https://openalex.org/W4309397398","https://openalex.org/W4312852845","https://openalex.org/W4313162371","https://openalex.org/W4386075583","https://openalex.org/W4390871962","https://openalex.org/W4394593020","https://openalex.org/W6755207826","https://openalex.org/W6791353385","https://openalex.org/W6839446344","https://openalex.org/W6846210491"],"related_works":["https://openalex.org/W4234874385","https://openalex.org/W2021787609","https://openalex.org/W2363753014","https://openalex.org/W2385567678","https://openalex.org/W2355121635","https://openalex.org/W1967100394","https://openalex.org/W4312476862","https://openalex.org/W2016995243","https://openalex.org/W1495086659","https://openalex.org/W2382163390"],"abstract_inverted_index":{"3D":[0,14,53,62],"visual":[1],"grounding":[2,98],"is":[3,21,122],"an":[4],"emerging":[5],"research":[6],"area":[7],"dedicated":[8],"to":[9,76],"making":[10],"connections":[11],"between":[12,50],"the":[13,59,79,96,102,108,112,115],"physical":[15],"world":[16],"and":[17,42,46,52,61,70,124],"natural":[18],"language,":[19],"which":[20],"crucial":[22],"for":[23],"achieving":[24],"embodied":[25],"intelligence.":[26],"In":[27],"this":[28],"paper,":[29],"we":[30],"propose":[31],"DASANet,":[32],"a":[33,72],"Dual":[34],"Attribute-Spatial":[35],"relation":[36,48],"Alignment":[37],"Network":[38],"that":[39,119],"separately":[40,77],"models":[41],"aligns":[43],"object":[44],"attributes":[45],"spatial":[47],"features":[49],"language":[51,60],"vision":[54],"modalities.":[55],"We":[56],"decompose":[57],"both":[58],"point":[63],"cloud":[64],"input":[65],"into":[66],"two":[67,116],"separate":[68],"parts":[69],"design":[71],"dual-branch":[73],"attention":[74],"module":[75],"model":[78],"decomposed":[80],"inputs":[81],"while":[82],"preserving":[83],"global":[84],"context":[85],"in":[86],"attribute-spatial":[87],"feature":[88],"fusion":[89],"by":[90],"cross":[91],"attentions.":[92],"Our":[93],"DASANet":[94],"achieves":[95],"highest":[97],"accuracy":[99],"65.1%":[100],"on":[101],"Nr3D":[103],"dataset,":[104],"1.3%":[105],"higher":[106],"than":[107],"best":[109],"competitor.":[110],"Besides,":[111],"visualization":[113],"of":[114],"branches":[117],"proves":[118],"our":[120],"method":[121],"efficient":[123],"highly":[125],"interpretable.":[126]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-12-26T23:08:49.675405","created_date":"2025-10-10T00:00:00"}
