{"id":"https://openalex.org/W4415538285","doi":"https://doi.org/10.1145/3746027.3755361","title":"Visual Localization using Hybrid Feature Grid and Learned Weighted Global Point Cloud","display_name":"Visual Localization using Hybrid Feature Grid and Learned Weighted Global Point Cloud","publication_year":2025,"publication_date":"2025-10-25","ids":{"openalex":"https://openalex.org/W4415538285","doi":"https://doi.org/10.1145/3746027.3755361"},"language":null,"primary_location":{"id":"doi:10.1145/3746027.3755361","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3755361","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100649295","display_name":"Junyi Wang","orcid":"https://orcid.org/0000-0002-3191-1662"},"institutions":[{"id":"https://openalex.org/I80143920","display_name":"Shandong University of Science and Technology","ror":"https://ror.org/04gtjhw98","country_code":"CN","type":"education","lineage":["https://openalex.org/I80143920"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Junyi Wang","raw_affiliation_strings":["School of Computer Science and Technology, Shandong University, Qingdao, Shandong, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Shandong University, Qingdao, Shandong, China","institution_ids":["https://openalex.org/I80143920"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101491985","display_name":"Yue Qi","orcid":"https://orcid.org/0000-0001-9304-1933"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yue Qi","raw_affiliation_strings":["State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing, China and Qingdao Research Institute of Beihang University, Qingdao, Shandong, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing, China and Qingdao Research Institute of Beihang University, Qingdao, Shandong, China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5100649295"],"corresponding_institution_ids":["https://openalex.org/I80143920"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.43036641,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4222","last_page":"4231"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11211","display_name":"3D Surveying and Cultural Heritage","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1907","display_name":"Geology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11211","display_name":"3D Surveying and Cultural Heritage","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1907","display_name":"Geology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11164","display_name":"Remote Sensing and LiDAR Applications","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.8241000175476074},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.6449999809265137},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5934000015258789},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.578000009059906},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.5676000118255615},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.4462999999523163},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4438000023365021},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.42179998755455017},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4117000102996826}],"concepts":[{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.8241000175476074},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.741100013256073},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7390999794006348},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.6449999809265137},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6055999994277954},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5934000015258789},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.578000009059906},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.5676000118255615},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.4462999999523163},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4438000023365021},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.42179998755455017},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4117000102996826},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.33820000290870667},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.3327000141143799},{"id":"https://openalex.org/C195958017","wikidata":"https://www.wikidata.org/wiki/Q1675268","display_name":"Iterative closest point","level":3,"score":0.29350000619888306},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2922999858856201},{"id":"https://openalex.org/C36613465","wikidata":"https://www.wikidata.org/wiki/Q4636322","display_name":"3D pose estimation","level":3,"score":0.29159998893737793},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.2896000146865845},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2892000079154968},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.28189998865127563},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.28049999475479126},{"id":"https://openalex.org/C86369673","wikidata":"https://www.wikidata.org/wiki/Q1203659","display_name":"Simultaneous localization and mapping","level":4,"score":0.2791999876499176},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.2721000015735626},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.27059999108314514},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.26579999923706055},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.2581999897956848},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.257999986410141}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746027.3755361","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3755361","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W2522940611","https://openalex.org/W2808571300","https://openalex.org/W2938672559","https://openalex.org/W3043971245","https://openalex.org/W3146082954","https://openalex.org/W3201936322","https://openalex.org/W4200150166","https://openalex.org/W4295129611","https://openalex.org/W4385318467","https://openalex.org/W4386171318","https://openalex.org/W4388915193","https://openalex.org/W4403510251","https://openalex.org/W4413145330"],"related_works":[],"abstract_inverted_index":{"To":[0,103,123],"fully":[1],"leverage":[2],"diverse":[3],"scene":[4],"representations":[5],"for":[6,145],"visual":[7],"relocalization,":[8],"we":[9,85,107,130],"propose":[10,108],"a":[11,54,65,71,79,132,151,172],"novel":[12],"localization":[13,26],"framework":[14],"that":[15,192],"systematically":[16],"establishes":[17],"inter-frame":[18],"relationships":[19],"and":[20,46,49,96,128,164,187,201],"integrates":[21],"multiple":[22],"feature":[23,152],"modalities.":[24],"Our":[25],"pipeline":[27],"comprises":[28],"three":[29,138,161],"key":[30],"stages,":[31],"containing":[32],"initial":[33,60],"pose":[34,41,50,83,105],"estimation":[35,52],"using":[36,78],"local":[37,73],"point":[38,68],"cloud":[39,69],"structure,":[40],"refinement":[42],"by":[43],"hand-crafted":[44,94],"features":[45,144],"3D":[47,97],"Gaussians,":[48],"confidence":[51,121],"through":[53],"leaned":[55],"global":[56],"representation.":[57],"Specifically,":[58],"the":[59,87,109,146,157,160,177,184],"stage":[61],"begins":[62],"with":[63,171],"aligning":[64],"known":[66],"source":[67],"to":[70,99,119,155,175],"predicted":[72],"Target":[74],"Point":[75,113],"Cloud":[76,114],"(TPC)":[77],"registration":[80],"algorithm.":[81],"For":[82],"refinement,":[84],"introduce":[86],"Hybrid":[88],"Feature":[89],"Grid":[90],"(HFG),":[91],"which":[92],"fuses":[93],"points":[95],"Gaussians":[98],"enrich":[100],"texture":[101],"cues.":[102],"assess":[104],"reliability,":[106],"learned":[110],"Weighted":[111],"Global":[112],"(WGPC),":[115],"aggregating":[116],"multi-frame":[117],"information":[118],"enhance":[120],"estimation.":[122],"jointly":[124],"learn":[125],"TPC,":[126],"HFG,":[127],"WGPC,":[129],"design":[131],"Siamese":[133],"Localization":[134],"Network":[135],"(SiaLocNet)":[136],"featuring":[137],"core":[139,162],"innovations,":[140],"including":[141],"learning":[142],"trajectory-based":[143],"limitation":[147],"of":[148,159,179],"single-view":[149],"inputs,":[150],"fusion":[153],"module":[154],"facilitate":[156],"construction":[158],"structures.":[163],"an":[165],"inverse":[166],"self":[167],"Chamfer":[168],"Distance":[169],"along":[170],"shape-aware":[173],"term":[174],"improve":[176],"robustness":[178],"WGPC.":[180],"Extensive":[181],"experiments":[182],"on":[183],"7":[185],"Scenes":[186],"Cambridge":[188],"Landmarks":[189],"datasets":[190],"demonstrate":[191],"our":[193],"method":[194],"achieves":[195],"state-ofthe-art":[196],"performance":[197],"across":[198],"both":[199],"indoor":[200],"outdoor":[202],"environments.":[203]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-25T00:00:00"}
