{"id":"https://openalex.org/W4403826703","doi":"https://doi.org/10.1109/access.2024.3487171","title":"Enhancing Visual Place Recognition With Hybrid Attention Mechanisms in MixVPR","display_name":"Enhancing Visual Place Recognition With Hybrid Attention Mechanisms in MixVPR","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4403826703","doi":"https://doi.org/10.1109/access.2024.3487171"},"language":"en","primary_location":{"id":"doi:10.1109/access.2024.3487171","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3487171","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2024.3487171","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045863168","display_name":"Jun Hu","orcid":"https://orcid.org/0000-0002-7094-1901"},"institutions":[{"id":"https://openalex.org/I4210134419","display_name":"Neusoft (China)","ror":"https://ror.org/02zc84r97","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134419"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Hu","raw_affiliation_strings":["Neusoft Reach Automotive Technology (Shenyang) Company Ltd., Shenyang, China"],"raw_orcid":"https://orcid.org/0000-0002-7094-1901","affiliations":[{"raw_affiliation_string":"Neusoft Reach Automotive Technology (Shenyang) Company Ltd., Shenyang, China","institution_ids":["https://openalex.org/I4210134419"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072381801","display_name":"Jiwei Nie","orcid":"https://orcid.org/0000-0003-3639-4729"},"institutions":[{"id":"https://openalex.org/I4210134419","display_name":"Neusoft (China)","ror":"https://ror.org/02zc84r97","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134419"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiwei Nie","raw_affiliation_strings":["Neusoft Reach Automotive Technology (Shenyang) Company Ltd., Shenyang, China"],"raw_orcid":"https://orcid.org/0000-0003-3639-4729","affiliations":[{"raw_affiliation_string":"Neusoft Reach Automotive Technology (Shenyang) Company Ltd., Shenyang, China","institution_ids":["https://openalex.org/I4210134419"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061986097","display_name":"Zuotao Ning","orcid":"https://orcid.org/0000-0003-3114-2784"},"institutions":[{"id":"https://openalex.org/I4210134419","display_name":"Neusoft (China)","ror":"https://ror.org/02zc84r97","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134419"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zuotao Ning","raw_affiliation_strings":["Neusoft Reach Automotive Technology (Shenyang) Company Ltd., Shenyang, China"],"raw_orcid":"https://orcid.org/0000-0003-3114-2784","affiliations":[{"raw_affiliation_string":"Neusoft Reach Automotive Technology (Shenyang) Company Ltd., Shenyang, China","institution_ids":["https://openalex.org/I4210134419"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034810639","display_name":"Chaolu Feng","orcid":"https://orcid.org/0000-0002-5575-2328"},"institutions":[{"id":"https://openalex.org/I1327237609","display_name":"Ministry of Education of the People's Republic of China","ror":"https://ror.org/01mv9t934","country_code":"CN","type":"government","lineage":["https://openalex.org/I1327237609","https://openalex.org/I4210127390"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chaolu Feng","raw_affiliation_strings":["Key Laboratory of Intelligent Computing in Medical Image, Ministry of Education, Shenyang, China"],"raw_orcid":"https://orcid.org/0000-0002-5575-2328","affiliations":[{"raw_affiliation_string":"Key Laboratory of Intelligent Computing in Medical Image, Ministry of Education, Shenyang, China","institution_ids":["https://openalex.org/I1327237609"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Luyang Wang","orcid":"https://orcid.org/0009-0002-1221-1174"},"institutions":[{"id":"https://openalex.org/I4210134419","display_name":"Neusoft (China)","ror":"https://ror.org/02zc84r97","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134419"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Luyang Wang","raw_affiliation_strings":["Neusoft Reach Automotive Technology (Shenyang) Company Ltd., Shenyang, China"],"raw_orcid":"https://orcid.org/0009-0002-1221-1174","affiliations":[{"raw_affiliation_string":"Neusoft Reach Automotive Technology (Shenyang) Company Ltd., Shenyang, China","institution_ids":["https://openalex.org/I4210134419"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jingyao Li","orcid":"https://orcid.org/0009-0006-8059-9923"},"institutions":[{"id":"https://openalex.org/I4210134419","display_name":"Neusoft (China)","ror":"https://ror.org/02zc84r97","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134419"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingyao Li","raw_affiliation_strings":["Neusoft Reach Automotive Technology (Shenyang) Company Ltd., Shenyang, China"],"raw_orcid":"https://orcid.org/0009-0006-8059-9923","affiliations":[{"raw_affiliation_string":"Neusoft Reach Automotive Technology (Shenyang) Company Ltd., Shenyang, China","institution_ids":["https://openalex.org/I4210134419"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101465765","display_name":"Shuai Cheng","orcid":"https://orcid.org/0009-0006-5871-6572"},"institutions":[{"id":"https://openalex.org/I4210134419","display_name":"Neusoft (China)","ror":"https://ror.org/02zc84r97","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134419"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuai Cheng","raw_affiliation_strings":["Neusoft Reach Automotive Technology (Shenyang) Company Ltd., Shenyang, China"],"raw_orcid":"https://orcid.org/0009-0006-5871-6572","affiliations":[{"raw_affiliation_string":"Neusoft Reach Automotive Technology (Shenyang) Company Ltd., Shenyang, China","institution_ids":["https://openalex.org/I4210134419"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.1738783,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"12","issue":null,"first_page":"159847","last_page":"159859"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9747999906539917,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9552000164985657,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7114986181259155},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3663915991783142},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36525237560272217},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3596663177013397},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.35497552156448364},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.343967080116272}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7114986181259155},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3663915991783142},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36525237560272217},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3596663177013397},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.35497552156448364},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.343967080116272}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2024.3487171","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3487171","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:29a59b5d8d2345d5a1cdf4b61f775d9c","is_oa":true,"landing_page_url":"https://doaj.org/article/29a59b5d8d2345d5a1cdf4b61f775d9c","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 12, Pp 159847-159859 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2024.3487171","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3487171","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W2013270301","https://openalex.org/W2073761981","https://openalex.org/W2147238549","https://openalex.org/W2204975001","https://openalex.org/W2284029970","https://openalex.org/W2580440899","https://openalex.org/W2619522967","https://openalex.org/W2737075200","https://openalex.org/W2744874208","https://openalex.org/W2885052112","https://openalex.org/W2939122829","https://openalex.org/W2940791172","https://openalex.org/W2951019013","https://openalex.org/W2963588253","https://openalex.org/W2964271799","https://openalex.org/W2984478347","https://openalex.org/W3034213661","https://openalex.org/W3034275286","https://openalex.org/W3043075211","https://openalex.org/W3095367607","https://openalex.org/W3110536152","https://openalex.org/W3124676898","https://openalex.org/W3163149666","https://openalex.org/W3173736705","https://openalex.org/W3184915579","https://openalex.org/W3204429916","https://openalex.org/W3206622090","https://openalex.org/W4210786584","https://openalex.org/W4296890702","https://openalex.org/W4312336574","https://openalex.org/W4312854990","https://openalex.org/W4319299901","https://openalex.org/W4319300119","https://openalex.org/W4366208220","https://openalex.org/W4383109186","https://openalex.org/W4386066001","https://openalex.org/W4386076349","https://openalex.org/W4389819300","https://openalex.org/W4390872200","https://openalex.org/W4392120897","https://openalex.org/W4399151845","https://openalex.org/W4402660141","https://openalex.org/W4402716379","https://openalex.org/W4403679663","https://openalex.org/W6636494156","https://openalex.org/W6766978945","https://openalex.org/W6851800889","https://openalex.org/W6859146851","https://openalex.org/W6861928822","https://openalex.org/W6868833508","https://openalex.org/W6869461496"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Visual":[0],"Place":[1],"Recognition":[2],"(VPR)":[3],"is":[4,22],"a":[5,48,100],"fundamental":[6],"task":[7],"in":[8,53,79],"robotics":[9],"and":[10,96,118,150],"computer":[11],"vision,":[12],"where":[13],"the":[14,112,123,154,161],"ability":[15],"to":[16,77,160],"recognize":[17],"locations":[18],"from":[19],"visual":[20,125],"inputs":[21],"crucial":[23],"for":[24,127],"autonomous":[25],"navigation":[26],"systems.":[27],"Traditional":[28],"methods,":[29],"which":[30],"rely":[31],"on":[32,61,133],"handcrafted":[33],"features":[34],"or":[35],"standard":[36],"convolutional":[37],"neural":[38],"networks":[39],"(CNNs),":[40],"struggle":[41],"with":[42],"environmental":[43],"changes":[44],"that":[45,92,138],"significantly":[46],"alter":[47],"place\u2019s":[49],"appearance.":[50],"Recent":[51],"advancements":[52],"deep":[54],"learning":[55],"have":[56],"improved":[57,89],"VPR":[58,135],"by":[59],"focusing":[60],"deep-learned":[62],"features,":[63],"enhancing":[64],"robustness":[65],"under":[66],"varying":[67],"conditions.":[68],"However,":[69],"these":[70,84],"methods":[71],"often":[72],"overlook":[73],"saliency":[74,109],"cues,":[75],"leading":[76],"inefficiencies":[78],"dynamic":[80],"scenes.":[81],"To":[82],"address":[83],"limitations,":[85],"we":[86],"propose":[87],"an":[88],"MixVPR":[90],"model":[91],"incorporates":[93],"both":[94],"self-attention":[95],"cross-attention":[97],"mechanisms":[98,159],"through":[99],"spatial-wise":[101],"hybrid":[102],"attention":[103,158],"mechanism.":[104],"This":[105],"enhancement":[106],"integrates":[107],"spatial":[108],"cues":[110],"into":[111],"global":[113],"image":[114],"embedding,":[115],"improving":[116],"accuracy":[117],"reliability.":[119],"We":[120],"also":[121],"utilize":[122],"DINOv2":[124],"transformer":[126],"robust":[128],"feature":[129],"extraction.":[130],"Extensive":[131],"experiments":[132],"mainstream":[134],"benchmarks":[136],"demonstrate":[137],"our":[139,157],"method":[140],"achieves":[141],"superior":[142],"performance":[143,163],"while":[144],"maintaining":[145],"computational":[146],"efficiency.":[147],"Ablation":[148],"studies":[149],"visualizations":[151],"further":[152],"validate":[153],"contributions":[155],"of":[156],"model\u2019s":[162],"improvement.":[164]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
