{"id":"https://openalex.org/W3150696571","doi":"https://doi.org/10.1109/lgrs.2021.3068271","title":"Remote Sensing Image Generation Based on Attention Mechanism and VAE-MSGAN for ROI Extraction","display_name":"Remote Sensing Image Generation Based on Attention Mechanism and VAE-MSGAN for ROI Extraction","publication_year":2021,"publication_date":"2021-04-01","ids":{"openalex":"https://openalex.org/W3150696571","doi":"https://doi.org/10.1109/lgrs.2021.3068271","mag":"3150696571"},"language":"en","primary_location":{"id":"doi:10.1109/lgrs.2021.3068271","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lgrs.2021.3068271","pdf_url":null,"source":{"id":"https://openalex.org/S126920919","display_name":"IEEE Geoscience and Remote Sensing Letters","issn_l":"1545-598X","issn":["1545-598X","1558-0571"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Geoscience and Remote Sensing Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087779583","display_name":"Libao Zhang","orcid":"https://orcid.org/0000-0002-0888-2330"},"institutions":[{"id":"https://openalex.org/I25254941","display_name":"Beijing Normal University","ror":"https://ror.org/022k4wk35","country_code":"CN","type":"education","lineage":["https://openalex.org/I25254941"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Libao Zhang","raw_affiliation_strings":["School of Artificial Intelligence, Beijing Normal University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing Normal University, Beijing, China","institution_ids":["https://openalex.org/I25254941"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101898207","display_name":"Yanan Liu","orcid":"https://orcid.org/0000-0002-7095-0883"},"institutions":[{"id":"https://openalex.org/I25254941","display_name":"Beijing Normal University","ror":"https://ror.org/022k4wk35","country_code":"CN","type":"education","lineage":["https://openalex.org/I25254941"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanan Liu","raw_affiliation_strings":["School of Artificial Intelligence, Beijing Normal University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing Normal University, Beijing, China","institution_ids":["https://openalex.org/I25254941"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5087779583"],"corresponding_institution_ids":["https://openalex.org/I25254941"],"apc_list":null,"apc_paid":null,"fwci":1.4959,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.8392145,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"19","issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8567814826965332},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7177238464355469},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.664261519908905},{"id":"https://openalex.org/keywords/region-of-interest","display_name":"Region of interest","score":0.6319186687469482},{"id":"https://openalex.org/keywords/discriminator","display_name":"Discriminator","score":0.5876549482345581},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.5011398792266846},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4816702604293823},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.44343942403793335},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4401322603225708},{"id":"https://openalex.org/keywords/multispectral-image","display_name":"Multispectral image","score":0.4250478744506836},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.41880300641059875},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4128061532974243},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.4118371903896332},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4057885706424713},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.10123005509376526}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8567814826965332},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7177238464355469},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.664261519908905},{"id":"https://openalex.org/C19609008","wikidata":"https://www.wikidata.org/wiki/Q2138203","display_name":"Region of interest","level":2,"score":0.6319186687469482},{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.5876549482345581},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.5011398792266846},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4816702604293823},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.44343942403793335},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4401322603225708},{"id":"https://openalex.org/C173163844","wikidata":"https://www.wikidata.org/wiki/Q1761440","display_name":"Multispectral image","level":2,"score":0.4250478744506836},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.41880300641059875},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4128061532974243},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.4118371903896332},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4057885706424713},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.10123005509376526},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lgrs.2021.3068271","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lgrs.2021.3068271","pdf_url":null,"source":{"id":"https://openalex.org/S126920919","display_name":"IEEE Geoscience and Remote Sensing Letters","issn_l":"1545-598X","issn":["1545-598X","1558-0571"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Geoscience and Remote Sensing Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.7200000286102295}],"awards":[{"id":"https://openalex.org/G3872703625","display_name":null,"funder_award_id":"41771407","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4503850585","display_name":null,"funder_award_id":"L182029","funder_id":"https://openalex.org/F4320322919","funder_display_name":"Natural Science Foundation of Beijing Municipality"},{"id":"https://openalex.org/G5547827018","display_name":null,"funder_award_id":"61571050","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322919","display_name":"Natural Science Foundation of Beijing Municipality","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1901129140","https://openalex.org/W2099471712","https://openalex.org/W2133059825","https://openalex.org/W2593560791","https://openalex.org/W2790482089","https://openalex.org/W2791575150","https://openalex.org/W2901173979","https://openalex.org/W2920582597","https://openalex.org/W2963073614","https://openalex.org/W2964167449","https://openalex.org/W2967085153","https://openalex.org/W2985521021","https://openalex.org/W3101896960","https://openalex.org/W6640963894","https://openalex.org/W6685352114","https://openalex.org/W6687506355","https://openalex.org/W6765779288"],"related_works":["https://openalex.org/W2953246223","https://openalex.org/W4293320219","https://openalex.org/W3110074278","https://openalex.org/W4283584549","https://openalex.org/W2618858825","https://openalex.org/W2554314924","https://openalex.org/W2998859928","https://openalex.org/W3151498616","https://openalex.org/W4381885966","https://openalex.org/W4288256692"],"abstract_inverted_index":{"A":[0],"variety":[1],"of":[2,11,23,33,45,100,105,136,154,184],"deep":[3,47],"learning":[4],"approaches":[5],"have":[6],"been":[7],"applied":[8],"to":[9,73,96,112,130,149,191],"region":[10],"interest":[12],"(ROI)":[13],"extraction,":[14],"which":[15],"is":[16,71],"a":[17,53,110,145],"fundamental":[18],"task":[19],"in":[20,38,122],"the":[21,30,43,75,80,88,101,123,133,151,155,161,168,175,182],"field":[22],"remote":[24],"sensing":[25],"image":[26],"(RSI)":[27],"processing.":[28],"However,":[29],"unbalanced":[31],"distribution":[32,77],"positive":[34],"and":[35,67,78,119,139,166],"negative":[36],"samples":[37],"most":[39],"RSIs":[40,115],"greatly":[41],"restricts":[42],"performance":[44,183],"these":[46],"learning-based":[48],"methods.":[49,195],"In":[50],"this":[51],"study,":[52],"data":[54],"augmentation":[55],"method":[56,177],"based":[57],"on":[58],"variational":[59],"autoencoder-multiscale":[60],"generative":[61,194],"adversarial":[62],"network":[63],"(VAE-MSGAN)":[64],"with":[65,92,116],"spatial":[66,140],"channelwise":[68],"attention":[69],"(SCA)":[70],"proposed":[72,176],"balance":[74],"sample":[76],"improve":[79,150,181],"subsequent":[81],"ROI":[82,162,185],"extraction":[83,163,186],"results.":[84],"First,":[85],"we":[86,159],"combine":[87],"original":[89],"multispectral":[90],"information":[91],"handcrafted":[93],"texture":[94],"features":[95,104],"make":[97],"full":[98],"use":[99],"low-level":[102],"visual":[103,152],"RSIs.":[106],"We":[107,142],"then":[108],"design":[109],"VAE-MSGAN":[111],"generate":[113],"realistic":[114],"high":[117],"quality":[118,153],"diversity.":[120],"Specifically,":[121],"generator":[124],"construct,":[125],"SCA":[126],"blocks":[127],"are":[128],"introduced":[129],"adaptively":[131],"recalibrate":[132],"varying":[134],"importance":[135],"different":[137],"channels":[138],"regions.":[141],"also":[143,188],"build":[144],"multiscale":[146],"discriminator":[147],"architecture":[148],"generated":[156],"samples.":[157],"Finally,":[158],"compare":[160],"results":[164,172],"before":[165],"after":[167],"augmentation.":[169],"Our":[170],"experimental":[171],"demonstrate":[173],"that":[174],"can":[178],"not":[179],"only":[180],"but":[187],"be":[189],"superior":[190],"other":[192],"classical":[193]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1}],"updated_date":"2025-12-23T23:11:35.936235","created_date":"2025-10-10T00:00:00"}
