{"id":"https://openalex.org/W4400525589","doi":"https://doi.org/10.1145/3626772.3657673","title":"Img2Loc: Revisiting Image Geolocalization using Multi-modality Foundation Models and Image-based Retrieval-Augmented Generation","display_name":"Img2Loc: Revisiting Image Geolocalization using Multi-modality Foundation Models and Image-based Retrieval-Augmented Generation","publication_year":2024,"publication_date":"2024-07-10","ids":{"openalex":"https://openalex.org/W4400525589","doi":"https://doi.org/10.1145/3626772.3657673"},"language":"en","primary_location":{"id":"doi:10.1145/3626772.3657673","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3626772.3657673","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 47th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050749778","display_name":"Zhongliang Zhou","orcid":"https://orcid.org/0000-0003-4471-6759"},"institutions":[{"id":"https://openalex.org/I165733156","display_name":"University of Georgia","ror":"https://ror.org/00te3t702","country_code":"US","type":"education","lineage":["https://openalex.org/I165733156"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Zhongliang Zhou","raw_affiliation_strings":["University of Georgia, Athens, GA, USA"],"affiliations":[{"raw_affiliation_string":"University of Georgia, Athens, GA, USA","institution_ids":["https://openalex.org/I165733156"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059624873","display_name":"Jielu Zhang","orcid":"https://orcid.org/0000-0002-4321-0580"},"institutions":[{"id":"https://openalex.org/I165733156","display_name":"University of Georgia","ror":"https://ror.org/00te3t702","country_code":"US","type":"education","lineage":["https://openalex.org/I165733156"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jielu Zhang","raw_affiliation_strings":["University of Georgia, Athens, GA, USA"],"affiliations":[{"raw_affiliation_string":"University of Georgia, Athens, GA, USA","institution_ids":["https://openalex.org/I165733156"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067459053","display_name":"Zihan Guan","orcid":"https://orcid.org/0000-0002-0331-3403"},"institutions":[{"id":"https://openalex.org/I51556381","display_name":"University of Virginia","ror":"https://ror.org/0153tk833","country_code":"US","type":"education","lineage":["https://openalex.org/I51556381"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zihan Guan","raw_affiliation_strings":["University of Virginia, Charlottesville, VA, USA"],"affiliations":[{"raw_affiliation_string":"University of Virginia, Charlottesville, VA, USA","institution_ids":["https://openalex.org/I51556381"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033865274","display_name":"Mengxuan Hu","orcid":"https://orcid.org/0000-0002-8822-2884"},"institutions":[{"id":"https://openalex.org/I51556381","display_name":"University of Virginia","ror":"https://ror.org/0153tk833","country_code":"US","type":"education","lineage":["https://openalex.org/I51556381"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mengxuan Hu","raw_affiliation_strings":["University of Virginia, Charlottesville, VA, USA"],"affiliations":[{"raw_affiliation_string":"University of Virginia, Charlottesville, VA, USA","institution_ids":["https://openalex.org/I51556381"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087022523","display_name":"Ni Lao","orcid":"https://orcid.org/0000-0002-4034-7784"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ni Lao","raw_affiliation_strings":["Google LLC, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google LLC, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060956126","display_name":"Lan Mu","orcid":"https://orcid.org/0000-0003-0199-9509"},"institutions":[{"id":"https://openalex.org/I165733156","display_name":"University of Georgia","ror":"https://ror.org/00te3t702","country_code":"US","type":"education","lineage":["https://openalex.org/I165733156"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lan Mu","raw_affiliation_strings":["University of Georgia, Athens, GA, USA"],"affiliations":[{"raw_affiliation_string":"University of Georgia, Athens, GA, USA","institution_ids":["https://openalex.org/I165733156"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100359839","display_name":"Sheng Li","orcid":"https://orcid.org/0000-0003-1205-8632"},"institutions":[{"id":"https://openalex.org/I51556381","display_name":"University of Virginia","ror":"https://ror.org/0153tk833","country_code":"US","type":"education","lineage":["https://openalex.org/I51556381"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sheng Li","raw_affiliation_strings":["University of Virginia, Charlottesville, VA, USA"],"affiliations":[{"raw_affiliation_string":"University of Virginia, Charlottesville, VA, USA","institution_ids":["https://openalex.org/I51556381"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036007312","display_name":"Gengchen Mai","orcid":"https://orcid.org/0000-0002-7818-7309"},"institutions":[{"id":"https://openalex.org/I165733156","display_name":"University of Georgia","ror":"https://ror.org/00te3t702","country_code":"US","type":"education","lineage":["https://openalex.org/I165733156"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gengchen Mai","raw_affiliation_strings":["University of Georgia, Athens, GA, USA"],"affiliations":[{"raw_affiliation_string":"University of Georgia, Athens, GA, USA","institution_ids":["https://openalex.org/I165733156"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5050749778"],"corresponding_institution_ids":["https://openalex.org/I165733156"],"apc_list":null,"apc_paid":null,"fwci":3.4298,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.9371513,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2749","last_page":"2754"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.727394700050354},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5678176879882812},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.5518324971199036},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.5432639122009277},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.5291433930397034},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5187285542488098},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5129387378692627},{"id":"https://openalex.org/keywords/content-based-image-retrieval","display_name":"Content-based image retrieval","score":0.4416669011116028},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3845829963684082},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.05856055021286011}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.727394700050354},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5678176879882812},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.5518324971199036},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.5432639122009277},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.5291433930397034},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5187285542488098},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5129387378692627},{"id":"https://openalex.org/C2780052074","wikidata":"https://www.wikidata.org/wiki/Q1128648","display_name":"Content-based image retrieval","level":4,"score":0.4416669011116028},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3845829963684082},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.05856055021286011},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3626772.3657673","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3626772.3657673","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 47th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.699999988079071,"display_name":"Climate action","id":"https://metadata.un.org/sdg/13"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W2199890863","https://openalex.org/W2284646714","https://openalex.org/W2587639398","https://openalex.org/W2598199894","https://openalex.org/W2886604692","https://openalex.org/W2895392434","https://openalex.org/W2963474852","https://openalex.org/W2964213180","https://openalex.org/W2981670313","https://openalex.org/W2986943971","https://openalex.org/W2998702515","https://openalex.org/W3023735075","https://openalex.org/W3034502973","https://openalex.org/W3035158519","https://openalex.org/W3096609285","https://openalex.org/W3110440461","https://openalex.org/W3179267034","https://openalex.org/W3195248159","https://openalex.org/W3212632252","https://openalex.org/W4206678795","https://openalex.org/W4221143046","https://openalex.org/W4284670538","https://openalex.org/W4286233797","https://openalex.org/W4290877196","https://openalex.org/W4384010587","https://openalex.org/W4386076111","https://openalex.org/W4386598503","https://openalex.org/W4387126838","https://openalex.org/W4389818116","https://openalex.org/W4390100354","https://openalex.org/W4392139636"],"related_works":["https://openalex.org/W2900811989","https://openalex.org/W2746816529","https://openalex.org/W2341223103","https://openalex.org/W2024252608","https://openalex.org/W2905186525","https://openalex.org/W2044706866","https://openalex.org/W2031096531","https://openalex.org/W4367727948","https://openalex.org/W3198880640","https://openalex.org/W3017331082"],"abstract_inverted_index":{"Geolocating":[0],"precise":[1,55],"locations":[2,33],"from":[3,62],"images":[4,29,36,134],"presents":[5],"a":[6,38,86,94],"challenging":[7],"problem":[8],"in":[9],"computer":[10],"vision":[11],"and":[12,27,52,66,76,150],"information":[13],"retrieval.":[14],"Traditional":[15],"methods":[16],"typically":[17],"employ":[18],"either":[19],"classification-dividing":[20],"the":[21,49,70,156,173],"Earth's":[22],"surface":[23],"into":[24],"grid":[25],"cells":[26],"classifying":[28],"accordingly,":[30],"or":[31,109],"retrieval-identifying":[32],"by":[34,48],"matching":[35],"with":[37,111,133],"database":[39],"of":[40,69,158,172],"image-location":[41],"pairs.":[42],"However,":[43],"classification-based":[44],"approaches":[45],"are":[46],"limited":[47],"cell":[50],"size":[51],"cannot":[53],"yield":[54],"predictions,":[56],"while":[57],"retrieval-based":[58],"systems":[59],"usually":[60],"suffer":[61],"poor":[63],"search":[64],"quality":[65],"inadequate":[67],"coverage":[68],"global":[71],"landscape":[72],"at":[73],"varied":[74],"scale":[75],"aggregation":[77],"levels.":[78],"To":[79],"overcome":[80],"these":[81],"drawbacks,":[82],"we":[83],"present":[84],"Img2Loc,":[85],"novel":[87],"system":[88,174],"that":[89],"redefines":[90],"image":[91],"geolocalization":[92],"as":[93,148],"text":[95],"generation":[96],"task.":[97],"This":[98],"is":[99],"achieved":[100],"using":[101],"cutting-edge":[102],"large":[103],"multi-modality":[104],"models":[105,161],"(LMMs)":[106],"like":[107],"GPT-4V":[108],"LLaVA":[110],"retrieval":[112],"augmented":[113],"generation.":[114],"Img2Loc":[115,152],"first":[116],"employs":[117],"CLIP-based":[118],"representations":[119],"to":[120],"generate":[121],"an":[122],"image-based":[123],"coordinate":[124],"query":[125,131],"database.":[126],"It":[127],"then":[128],"uniquely":[129],"combines":[130],"results":[132],"itself,":[135],"forming":[136],"elaborate":[137],"prompts":[138],"customized":[139],"for":[140],"LMMs.":[141],"When":[142],"tested":[143],"on":[144],"benchmark":[145],"datasets":[146],"such":[147],"Im2GPS3k":[149],"YFCC4k,":[151],"not":[153],"only":[154],"surpasses":[155],"performance":[157],"previous":[159],"state-of-the-art":[160],"but":[162],"does":[163],"so":[164],"without":[165],"any":[166],"model":[167],"training.":[168],"A":[169],"video":[170],"demonstration":[171],"can":[175],"be":[176],"accessed":[177],"via":[178],"this":[179],"link":[180],"https://drive.google.com/file/d/16A6A-mc7AyUoKHRH3_WBRToRC13sn7tU/view?usp=sharing":[181]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
