{"id":"https://openalex.org/W3185774045","doi":"https://doi.org/10.1109/whispers52202.2021.9484057","title":"A Unified Multimodal Deep Learning Framework For Remote Sensing Imagery Classification","display_name":"A Unified Multimodal Deep Learning Framework For Remote Sensing Imagery Classification","publication_year":2021,"publication_date":"2021-03-24","ids":{"openalex":"https://openalex.org/W3185774045","doi":"https://doi.org/10.1109/whispers52202.2021.9484057","mag":"3185774045"},"language":"en","primary_location":{"id":"doi:10.1109/whispers52202.2021.9484057","is_oa":false,"landing_page_url":"https://doi.org/10.1109/whispers52202.2021.9484057","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 11th Workshop on Hyperspectral Imaging and Signal Processing: Evolution in Remote Sensing (WHISPERS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075013625","display_name":"Danfeng Hong","orcid":"https://orcid.org/0000-0002-3212-9584"},"institutions":[{"id":"https://openalex.org/I2898391981","display_name":"Deutsches Zentrum f\u00fcr Luft- und Raumfahrt e. V. (DLR)","ror":"https://ror.org/04bwf3e34","country_code":"DE","type":"facility","lineage":["https://openalex.org/I1305996414","https://openalex.org/I2898391981"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Danfeng Hong","raw_affiliation_strings":["Germany Aerospace Center (DLR), Remote Sensing Technology Institute (IMF), Wessling, Germany"],"affiliations":[{"raw_affiliation_string":"Germany Aerospace Center (DLR), Remote Sensing Technology Institute (IMF), Wessling, Germany","institution_ids":["https://openalex.org/I2898391981"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066378186","display_name":"Lianru Gao","orcid":"https://orcid.org/0000-0003-3888-8124"},"institutions":[{"id":"https://openalex.org/I4210137199","display_name":"Aerospace Information Research Institute","ror":"https://ror.org/0419fj215","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210137199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lianru Gao","raw_affiliation_strings":["Key Laboratory of Digital Earth Science, Aerospace Information Research Institute (AIR), CAS, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Digital Earth Science, Aerospace Information Research Institute (AIR), CAS, Beijing, China","institution_ids":["https://openalex.org/I4210137199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100761149","display_name":"Xin Wu","orcid":"https://orcid.org/0000-0002-1733-3560"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Wu","raw_affiliation_strings":["School of Information and Electronics, Beijing Institute of Technology (BIT), Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Information and Electronics, Beijing Institute of Technology (BIT), Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013885739","display_name":"Jing Yao","orcid":"https://orcid.org/0000-0003-1301-9758"},"institutions":[{"id":"https://openalex.org/I4210137199","display_name":"Aerospace Information Research Institute","ror":"https://ror.org/0419fj215","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210137199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Yao","raw_affiliation_strings":["Key Laboratory of Digital Earth Science, Aerospace Information Research Institute (AIR), CAS, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Digital Earth Science, Aerospace Information Research Institute (AIR), CAS, Beijing, China","institution_ids":["https://openalex.org/I4210137199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034435383","display_name":"Naoto Yokoya","orcid":"https://orcid.org/0000-0002-7321-4590"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]},{"id":"https://openalex.org/I4210126580","display_name":"RIKEN Center for Advanced Intelligence Project","ror":"https://ror.org/03ckxwf91","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210126580"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Naoto Yokoya","raw_affiliation_strings":["Graduate School of Frontier Sciences, the University of Tokyo, Chiba, Japan","RIKEN Center for Advanced Intelligence Project (AIP), RIKEN, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Frontier Sciences, the University of Tokyo, Chiba, Japan","institution_ids":["https://openalex.org/I74801974"]},{"raw_affiliation_string":"RIKEN Center for Advanced Intelligence Project (AIP), RIKEN, Tokyo, Japan","institution_ids":["https://openalex.org/I4210126580"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100389658","display_name":"Bing Zhang","orcid":"https://orcid.org/0000-0001-7311-9844"},"institutions":[{"id":"https://openalex.org/I4210137199","display_name":"Aerospace Information Research Institute","ror":"https://ror.org/0419fj215","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210137199"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bing Zhang","raw_affiliation_strings":["College of Resources and Environment, University of Chinese Academy of Sciences, Beijing, China","Key Laboratory of Digital Earth Science, Aerospace Information Research Institute (AIR), CAS, Beijing, China"],"affiliations":[{"raw_affiliation_string":"College of Resources and Environment, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Key Laboratory of Digital Earth Science, Aerospace Information Research Institute (AIR), CAS, Beijing, China","institution_ids":["https://openalex.org/I4210137199"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5075013625"],"corresponding_institution_ids":["https://openalex.org/I2898391981"],"apc_list":null,"apc_paid":null,"fwci":0.2493,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.57728097,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.975600004196167,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7452104687690735},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6319563388824463},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6144351363182068},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5683979988098145},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5096085071563721},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5061008334159851},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.48918893933296204},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.48521021008491516},{"id":"https://openalex.org/keywords/image-fusion","display_name":"Image fusion","score":0.47952890396118164},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.47341448068618774},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.4624137878417969},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4530557692050934},{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.44509539008140564},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.4288880527019501},{"id":"https://openalex.org/keywords/contextual-image-classification","display_name":"Contextual image classification","score":0.41274142265319824},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.37066489458084106},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.2942514419555664}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7452104687690735},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6319563388824463},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6144351363182068},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5683979988098145},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5096085071563721},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5061008334159851},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.48918893933296204},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.48521021008491516},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.47952890396118164},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.47341448068618774},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.4624137878417969},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4530557692050934},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.44509539008140564},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.4288880527019501},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.41274142265319824},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37066489458084106},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2942514419555664},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/whispers52202.2021.9484057","is_oa":false,"landing_page_url":"https://doi.org/10.1109/whispers52202.2021.9484057","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 11th Workshop on Hyperspectral Imaging and Signal Processing: Evolution in Remote Sensing (WHISPERS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W1836465849","https://openalex.org/W2035875937","https://openalex.org/W2140797190","https://openalex.org/W2146062404","https://openalex.org/W2609880332","https://openalex.org/W2625894731","https://openalex.org/W2755992512","https://openalex.org/W2902746003","https://openalex.org/W2907147407","https://openalex.org/W2910655660","https://openalex.org/W2924927660","https://openalex.org/W2949117887","https://openalex.org/W2962702700","https://openalex.org/W2977355106","https://openalex.org/W2994639710","https://openalex.org/W3004968762","https://openalex.org/W3009883650","https://openalex.org/W3040988483","https://openalex.org/W3046027728","https://openalex.org/W3047443805","https://openalex.org/W3048631361","https://openalex.org/W3081753142","https://openalex.org/W3100714546","https://openalex.org/W3101012758","https://openalex.org/W3101640299","https://openalex.org/W3102692100","https://openalex.org/W3103695279","https://openalex.org/W3105021316","https://openalex.org/W3105298104","https://openalex.org/W3105997607","https://openalex.org/W3122774149","https://openalex.org/W3153012724","https://openalex.org/W6638667902"],"related_works":["https://openalex.org/W3013693939","https://openalex.org/W2159052453","https://openalex.org/W2566616303","https://openalex.org/W3131327266","https://openalex.org/W4297051394","https://openalex.org/W2752972570","https://openalex.org/W2391745328","https://openalex.org/W4214649316","https://openalex.org/W2154495931","https://openalex.org/W2554790198"],"abstract_inverted_index":{"In":[0],"this":[1,50],"paper,":[2],"we":[3,52,85],"present":[4],"a":[5,23,40,90],"unified":[6],"deep":[7],"learning":[8,95,100],"framework":[9,123],"for":[10,17,32,139],"multimodal":[11],"remote":[12,126],"sensing":[13,127],"image":[14,128],"classification,":[15],"U-MDL":[16,19,81,122],"short.":[18],"attempts":[20],"to":[21,47,88,113],"develop":[22],"general":[24],"network":[25],"architecture":[26],"that":[27,97],"consists":[28],"of":[29,93,119,142],"two":[30],"subnetworks":[31],"feature":[33,36],"extraction":[34],"and":[35,45,70,117,133],"fusion,":[37,65,67,69],"respectively,":[38],"with":[39],"focus":[41],"on":[42],"\"which\",":[43],"\"when\",":[44],"\"how\"":[46],"fuse.":[48],"For":[49],"purpose,":[51],"detail":[53],"several":[54],"common":[55],"but":[56],"effective":[57],"fusion":[58],"modules":[59,74],"in":[60,105,124],"the":[61,115,120,125,140],"networks,":[62],"e.g.,":[63],"early":[64],"middle":[66],"late":[68],"encoder-decoder":[71],"fusion.":[72],"These":[73],"can":[75],"be":[76],"generalized":[77],"well":[78],"into":[79],"our":[80],"framework.":[82],"More":[83],"significantly,":[84],"also":[86],"emphasize":[87],"investigate":[89],"special":[91],"case":[92],"multi-modality":[94],"(MML),":[96],"is,":[98],"cross-modality":[99],"(CML)":[101],"which":[102],"widely":[103],"exists":[104],"real":[106],"applications.":[107],"Moreover,":[108],"extensive":[109],"experiments":[110],"are":[111,135],"conducted":[112],"demonstrate":[114],"superiority":[116],"effectiveness":[118],"proposed":[121],"classification":[129],"task.":[130],"The":[131],"codes":[132],"datasets":[134],"available":[136],"at:":[137],"https://github.com/danfenghong/IEEE_TGRS_MDL-RS":[138],"sake":[141],"reproducibility.":[143]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
