{"id":"https://openalex.org/W4362496428","doi":"https://doi.org/10.1109/tgrs.2023.3264006","title":"Self-Supervision Interactive Alignment for Remote Sensing Image\u2013Audio Retrieval","display_name":"Self-Supervision Interactive Alignment for Remote Sensing Image\u2013Audio Retrieval","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4362496428","doi":"https://doi.org/10.1109/tgrs.2023.3264006"},"language":"en","primary_location":{"id":"doi:10.1109/tgrs.2023.3264006","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tgrs.2023.3264006","pdf_url":null,"source":{"id":"https://openalex.org/S111326731","display_name":"IEEE Transactions on Geoscience and Remote Sensing","issn_l":"0196-2892","issn":["0196-2892","1558-0644"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Geoscience and Remote Sensing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065098091","display_name":"Jinghao Huang","orcid":"https://orcid.org/0009-0001-3362-3023"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210149102","display_name":"Sanya University","ror":"https://ror.org/04fa2qd52","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210149102"]},{"id":"https://openalex.org/I4391012619","display_name":"Shanghai Artificial Intelligence Laboratory","ror":"https://ror.org/03wkvpx79","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391012619"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jinghao Huang","raw_affiliation_strings":["Sanya Science and Education Innovation Park, Wuhan University of Technology, Sanya, China","Shanghai Artificial Intelligence Laboratory, Shanghai, China","School of Computer Science and Artificial Intelligence, Wuhan University of Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"Sanya Science and Education Innovation Park, Wuhan University of Technology, Sanya, China","institution_ids":["https://openalex.org/I4210149102","https://openalex.org/I196699116"]},{"raw_affiliation_string":"Shanghai Artificial Intelligence Laboratory, Shanghai, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4391012619"]},{"raw_affiliation_string":"School of Computer Science and Artificial Intelligence, Wuhan University of Technology, Wuhan, China","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003775716","display_name":"Yaxiong Chen","orcid":"https://orcid.org/0000-0002-2903-6723"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210149102","display_name":"Sanya University","ror":"https://ror.org/04fa2qd52","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210149102"]},{"id":"https://openalex.org/I4391012619","display_name":"Shanghai Artificial Intelligence Laboratory","ror":"https://ror.org/03wkvpx79","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391012619"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaxiong Chen","raw_affiliation_strings":["School of Computer Science and Artificial Intelligence, Wuhan University of Technology, Wuhan, China","Sanya Science and Education Innovation Park, Wuhan University of Technology, Sanya, China","Shanghai Artificial Intelligence Laboratory, Shanghai, China","Wuhan University of Technology Chongqing Research Institute, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Artificial Intelligence, Wuhan University of Technology, Wuhan, China","institution_ids":["https://openalex.org/I196699116"]},{"raw_affiliation_string":"Sanya Science and Education Innovation Park, Wuhan University of Technology, Sanya, China","institution_ids":["https://openalex.org/I4210149102","https://openalex.org/I196699116"]},{"raw_affiliation_string":"Shanghai Artificial Intelligence Laboratory, Shanghai, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4391012619"]},{"raw_affiliation_string":"Wuhan University of Technology Chongqing Research Institute, Chongqing, China","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011707621","display_name":"Shengwu Xiong","orcid":"https://orcid.org/0000-0002-4006-7029"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210149102","display_name":"Sanya University","ror":"https://ror.org/04fa2qd52","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210149102"]},{"id":"https://openalex.org/I4391012619","display_name":"Shanghai Artificial Intelligence Laboratory","ror":"https://ror.org/03wkvpx79","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391012619"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shengwu Xiong","raw_affiliation_strings":["Sanya Science and Education Innovation Park, Wuhan University of Technology, Sanya, China","Wuhan University of Technology Chongqing Research Institute, Chongqing, China","School of Computer Science and Artificial Intelligence, Wuhan University of Technology, Wuhan, China","Shanghai Artificial Intelligence Laboratory, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Sanya Science and Education Innovation Park, Wuhan University of Technology, Sanya, China","institution_ids":["https://openalex.org/I4210149102","https://openalex.org/I196699116"]},{"raw_affiliation_string":"Wuhan University of Technology Chongqing Research Institute, Chongqing, China","institution_ids":["https://openalex.org/I196699116"]},{"raw_affiliation_string":"School of Computer Science and Artificial Intelligence, Wuhan University of Technology, Wuhan, China","institution_ids":["https://openalex.org/I196699116"]},{"raw_affiliation_string":"Shanghai Artificial Intelligence Laboratory, Shanghai, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4391012619"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5018824735","display_name":"Xiaoqiang Lu","orcid":"https://orcid.org/0000-0002-7037-5188"},"institutions":[{"id":"https://openalex.org/I80947539","display_name":"Fuzhou University","ror":"https://ror.org/011xvna82","country_code":"CN","type":"education","lineage":["https://openalex.org/I80947539"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoqiang Lu","raw_affiliation_strings":["College of Physics and Information Engineering, Fuzhou University, Fuzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Physics and Information Engineering, Fuzhou University, Fuzhou, China","institution_ids":["https://openalex.org/I80947539"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5065098091"],"corresponding_institution_ids":["https://openalex.org/I196699116","https://openalex.org/I4210100255","https://openalex.org/I4210149102","https://openalex.org/I4391012619"],"apc_list":null,"apc_paid":null,"fwci":1.5885,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.83555445,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"61","issue":null,"first_page":"1","last_page":"14"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9843999743461609,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11698","display_name":"Underwater Acoustics Research","score":0.9672999978065491,"subfield":{"id":"https://openalex.org/subfields/1910","display_name":"Oceanography"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8254221081733704},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7423017024993896},{"id":"https://openalex.org/keywords/salient","display_name":"Salient","score":0.5688115954399109},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.5383530259132385},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.5316546559333801},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48676180839538574},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.41009607911109924},{"id":"https://openalex.org/keywords/remote-sensing","display_name":"Remote sensing","score":0.3670996427536011},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3629881739616394},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.31806719303131104}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8254221081733704},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7423017024993896},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.5688115954399109},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.5383530259132385},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.5316546559333801},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48676180839538574},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.41009607911109924},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.3670996427536011},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3629881739616394},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.31806719303131104},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tgrs.2023.3264006","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tgrs.2023.3264006","pdf_url":null,"source":{"id":"https://openalex.org/S111326731","display_name":"IEEE Transactions on Geoscience and Remote Sensing","issn_l":"0196-2892","issn":["0196-2892","1558-0644"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Geoscience and Remote Sensing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7300000190734863,"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8"}],"awards":[{"id":"https://openalex.org/G2160690789","display_name":null,"funder_award_id":"WUT:223110001","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G4653825012","display_name":null,"funder_award_id":"62176194","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4976606596","display_name":null,"funder_award_id":"cstc2021jcyj-msxmX1148","funder_id":"https://openalex.org/F4320323172","funder_display_name":"Natural Science Foundation of Chongqing"},{"id":"https://openalex.org/G5095014359","display_name":null,"funder_award_id":"SCKJ-JYRC-2022-76","funder_id":"https://openalex.org/F4320336619","funder_display_name":"Science and Technology Project of Nantong City"},{"id":"https://openalex.org/G5761330415","display_name":null,"funder_award_id":"2022KF0020","funder_id":"https://openalex.org/F4320325431","funder_display_name":"Wuhan University of Science and Technology"},{"id":"https://openalex.org/G6202514691","display_name":null,"funder_award_id":"SCKJ-JYRC-2022-17","funder_id":"https://openalex.org/F4320336619","funder_display_name":"Science and Technology Project of Nantong City"},{"id":"https://openalex.org/G6356431383","display_name":null,"funder_award_id":"2022ZD0160604","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323172","display_name":"Natural Science Foundation of Chongqing","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320325431","display_name":"Wuhan University of Science and Technology","ror":"https://ror.org/00e4hrk88"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null},{"id":"https://openalex.org/F4320336619","display_name":"Science and Technology Project of Nantong City","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":73,"referenced_works":["https://openalex.org/W2013535308","https://openalex.org/W2030899956","https://openalex.org/W2095483845","https://openalex.org/W2096733369","https://openalex.org/W2098738957","https://openalex.org/W2100235303","https://openalex.org/W2137225583","https://openalex.org/W2194775991","https://openalex.org/W2401246392","https://openalex.org/W2510520237","https://openalex.org/W2513342512","https://openalex.org/W2580615709","https://openalex.org/W2619383789","https://openalex.org/W2619697695","https://openalex.org/W2740474318","https://openalex.org/W2740755807","https://openalex.org/W2763822693","https://openalex.org/W2770954831","https://openalex.org/W2804744787","https://openalex.org/W2842511635","https://openalex.org/W2910457605","https://openalex.org/W2945202593","https://openalex.org/W2964109005","https://openalex.org/W2969475198","https://openalex.org/W2974770574","https://openalex.org/W2981905048","https://openalex.org/W2986131686","https://openalex.org/W2987489329","https://openalex.org/W2988699317","https://openalex.org/W2989871747","https://openalex.org/W2990330438","https://openalex.org/W2997041949","https://openalex.org/W2997786074","https://openalex.org/W3004137323","https://openalex.org/W3025346498","https://openalex.org/W3091459254","https://openalex.org/W3095909497","https://openalex.org/W3102166635","https://openalex.org/W3108367559","https://openalex.org/W3109212767","https://openalex.org/W3118120400","https://openalex.org/W3127230150","https://openalex.org/W3133500032","https://openalex.org/W3138516171","https://openalex.org/W3140792177","https://openalex.org/W3142124201","https://openalex.org/W3154430790","https://openalex.org/W3165084071","https://openalex.org/W3170962139","https://openalex.org/W3198480870","https://openalex.org/W3201849546","https://openalex.org/W4200436929","https://openalex.org/W4224911357","https://openalex.org/W4281384435","https://openalex.org/W4282934494","https://openalex.org/W4283728979","https://openalex.org/W4289538158","https://openalex.org/W4297808394","https://openalex.org/W6630875275","https://openalex.org/W6729977899","https://openalex.org/W6747225742","https://openalex.org/W6764499465","https://openalex.org/W6766904570","https://openalex.org/W6771446814","https://openalex.org/W6772096607","https://openalex.org/W6786549506","https://openalex.org/W6788213132","https://openalex.org/W6789155089","https://openalex.org/W6791353385","https://openalex.org/W6792679155","https://openalex.org/W6798410899","https://openalex.org/W6805211771","https://openalex.org/W6810930567"],"related_works":["https://openalex.org/W2329500892","https://openalex.org/W28991112","https://openalex.org/W2370726991","https://openalex.org/W2369710579","https://openalex.org/W4327728159","https://openalex.org/W4394266730","https://openalex.org/W1990856605","https://openalex.org/W2053783616","https://openalex.org/W2130409173","https://openalex.org/W2380243858"],"abstract_inverted_index":{"Cross-modal":[0],"remote":[1,10,18,44,72,105,126,155,183,191,202],"sensing":[2,11,19,45,73,106,127,156,184,192,203],"image-audio":[3,74,193,204],"retrieval":[4,75,205],"aims":[5],"to":[6,15,30,94,138,149,169],"use":[7],"audio":[8,131,164],"or":[9,21],"images":[12,20,107,157],"as":[13,133],"queries":[14],"retrieve":[16],"relevant":[17],"corresponding":[22],"audios.":[23,109,159],"Although":[24],"many":[25],"approaches":[26],"leverage":[27,120],"labeled":[28,38,46],"samples":[29,39,47,93],"achieve":[31],"good":[32],"performance,":[33],"the":[34,96,102,114,121,124,134,171,197],"performance":[35,206],"cost":[36],"of":[37,88,91,116,174,182],"is":[40,57,147],"high,":[41],"because":[42],"cross-modal":[43,55,71,99,140],"usually":[48],"requires":[49],"huge":[50],"labor":[51],"resources.":[52],"Therefore,":[53],"unsupervised":[54,70],"learning":[56,112],"very":[58],"important":[59],"in":[60],"real-world":[61],"applications.":[62],"In":[63],"this":[64],"paper,":[65],"we":[66,119,161],"propose":[67],"a":[68,142],"novel":[69,143],"approach,":[76],"named":[77],"<italic":[78],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[79],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">Self-Supervision":[80],"Interactive":[81],"Alignment</i>":[82],"(SSIA),":[83],"which":[84,177],"can":[85,178],"take":[86],"advantage":[87],"large":[89],"amounts":[90],"unlabeled":[92],"learn":[95],"salient":[97,180],"information,":[98,118,176],"alignment":[100,145],"and":[101,108,130,158],"similarity":[103,122],"between":[104,123],"Since":[110],"self-supervised":[111],"lacks":[113],"supervision":[115,135],"label":[117],"input":[125],"image":[128,166],"information":[129,132,173,181],"information.":[136],"Besides,":[137],"perform":[139,199],"alignment,":[141],"interactive":[144],"module":[146,168],"designed":[148],"explore":[150],"fine":[151],"correspondence":[152],"relation":[153],"for":[154],"Moreover,":[160],"design":[162],"an":[163],"guided":[165],"de-redundant":[167],"reduce":[170],"redundant":[172],"visual":[175],"capture":[179],"images.":[185],"Extensive":[186],"experiments":[187],"on":[188],"four":[189],"widely-used":[190],"datasets":[194],"testify":[195],"that":[196],"SSIA":[198],"gain":[200],"better":[201],"than":[207],"other":[208],"compared":[209],"approaches.":[210]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-27T14:29:43.386196","created_date":"2025-10-10T00:00:00"}
