{"id":"https://openalex.org/W4403791570","doi":"https://doi.org/10.1145/3664647.3680604","title":"UrbanCross: Enhancing Satellite Image-Text Retrieval with Cross-Domain Adaptation","display_name":"UrbanCross: Enhancing Satellite Image-Text Retrieval with Cross-Domain Adaptation","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4403791570","doi":"https://doi.org/10.1145/3664647.3680604"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3680604","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680604","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5096912622","display_name":"Siru Zhong","orcid":"https://orcid.org/0009-0001-4465-8686"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Siru Zhong","raw_affiliation_strings":["The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112993208","display_name":"Xixuan Hao","orcid":"https://orcid.org/0000-0003-0728-1944"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xixuan Hao","raw_affiliation_strings":["The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065786703","display_name":"Y. H. Yan","orcid":"https://orcid.org/0009-0006-2546-1403"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yibo Yan","raw_affiliation_strings":["The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100386018","display_name":"Ying Zhang","orcid":"https://orcid.org/0000-0001-6411-4486"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ying Zhang","raw_affiliation_strings":["Northwestern Polytechnical University, Xi'an, China"],"affiliations":[{"raw_affiliation_string":"Northwestern Polytechnical University, Xi'an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020880385","display_name":"Yangqiu Song","orcid":"https://orcid.org/0000-0002-7818-6090"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Yangqiu Song","raw_affiliation_strings":["The Hong Kong University of Science and Technology, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology, Hong Kong, China","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5018828723","display_name":"Yuxuan Liang","orcid":"https://orcid.org/0000-0003-2817-7337"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuxuan Liang","raw_affiliation_strings":["The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5096912622"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.5732,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.85758238,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"6307","last_page":"6315"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9872999787330627,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.96670001745224,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7251874208450317},{"id":"https://openalex.org/keywords/domain-adaptation","display_name":"Domain adaptation","score":0.5760233402252197},{"id":"https://openalex.org/keywords/satellite","display_name":"Satellite","score":0.558933675289154},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.5505384206771851},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.5081639289855957},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.45619872212409973},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4538711905479431},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.44526994228363037},{"id":"https://openalex.org/keywords/remote-sensing","display_name":"Remote sensing","score":0.40670204162597656},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.32716113328933716},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3237961530685425},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.1592329740524292},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08060002326965332},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.061606407165527344}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7251874208450317},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.5760233402252197},{"id":"https://openalex.org/C19269812","wikidata":"https://www.wikidata.org/wiki/Q26540","display_name":"Satellite","level":2,"score":0.558933675289154},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.5505384206771851},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.5081639289855957},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.45619872212409973},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4538711905479431},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.44526994228363037},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.40670204162597656},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.32716113328933716},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3237961530685425},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.1592329740524292},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08060002326965332},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.061606407165527344},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3664647.3680604","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680604","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-146516","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-146516","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5299999713897705,"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2132077228","https://openalex.org/W2165698076","https://openalex.org/W2513506629","https://openalex.org/W2779054585","https://openalex.org/W2887131022","https://openalex.org/W3100245404","https://openalex.org/W3117344638","https://openalex.org/W3133962347","https://openalex.org/W3140792177","https://openalex.org/W3194015448","https://openalex.org/W3208803664","https://openalex.org/W4221146484","https://openalex.org/W4224911357","https://openalex.org/W4312795296","https://openalex.org/W4313121711","https://openalex.org/W4315778358","https://openalex.org/W4379806246","https://openalex.org/W4381790494","https://openalex.org/W4387969154","https://openalex.org/W4388189161","https://openalex.org/W4388624611","https://openalex.org/W4389474309","https://openalex.org/W4390874575","https://openalex.org/W4391021462"],"related_works":["https://openalex.org/W4394775207","https://openalex.org/W4389474468","https://openalex.org/W4300172004","https://openalex.org/W4321649381","https://openalex.org/W2997645659","https://openalex.org/W3180787869","https://openalex.org/W3203792196","https://openalex.org/W2955455867","https://openalex.org/W4295929828","https://openalex.org/W3156096827"],"abstract_inverted_index":{"Urbanization":[0],"challenges":[1],"underscore":[2],"the":[3,78,87,161],"necessity":[4],"for":[5,20,54,83,92],"effective":[6],"satellite":[7,56],"image-text":[8,57],"retrieval":[9,39,108,138],"methods":[10,25],"to":[11,72,141],"swiftly":[12],"access":[13],"specific":[14],"information":[15],"enriched":[16,65],"with":[17,66],"geographic":[18],"semantics":[19],"urban":[21,33,143],"applications.":[22],"However,":[23],"existing":[24],"often":[26],"overlook":[27],"significant":[28],"domain":[29,74,156,162],"gaps":[30],"across":[31,128],"diverse":[32],"landscapes,":[34],"primarily":[35],"focusing":[36],"on":[37],"enhancing":[38,126],"performance":[40,148],"within":[41],"single":[42],"domains.":[43,130],"To":[44],"tackle":[45],"this":[46],"issue,":[47],"we":[48],"present":[49],"UrbanCross,":[50],"a":[51,61,104,119],"new":[52,142],"framework":[53],"cross-domain":[55,63,122],"retrieval.":[58],"UrbanCross":[59,111],"leverages":[60],"high-quality,":[62],"dataset":[64,167],"extensive":[67],"geo-tags":[68],"from":[69],"three":[70],"countries":[71],"highlight":[73],"diversity.":[75],"It":[76],"employs":[77],"Large":[79],"Multimodal":[80],"Model":[81,90],"(LMM)":[82],"textual":[84],"refinement":[85],"and":[86,101,118,139,166],"Segment":[88],"Anything":[89],"(SAM)":[91],"visual":[93],"augmentation,":[94],"achieving":[95],"fine-grained":[96],"alignment":[97],"of":[98,150],"images,":[99],"segments":[100],"texts,":[102],"yielding":[103],"10%":[105],"improvement":[106],"in":[107,137],"performance.":[109],"Additionally,":[110],"incorporates":[112],"an":[113,146],"adaptive":[114],"curriculum-based":[115],"source":[116],"sampler":[117],"weighted":[120],"adversarial":[121],"fine-tuning":[123],"module,":[124],"progressively":[125],"adaptability":[127],"various":[129],"Extensive":[131],"experiments":[132],"confirm":[133],"UrbanCross's":[134],"superior":[135],"efficiency":[136],"adaptation":[140,157],"environments,":[144],"demonstrating":[145],"average":[147],"increase":[149],"15%":[151],"over":[152],"its":[153],"version":[154],"without":[155],"mechanisms,":[158],"effectively":[159],"bridging":[160],"gap.":[163],"Our":[164],"code":[165],"are":[168],"publicly":[169],"accessible":[170],"at":[171],"https://github.com/siruzhong/UrbanCross.":[172]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
