{"id":"https://openalex.org/W4416798816","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11249233","title":"Rain Removal Via Vae-Enhanced Transformer with Hierarchical Feature Integration","display_name":"Rain Removal Via Vae-Enhanced Transformer with Hierarchical Feature Integration","publication_year":2025,"publication_date":"2025-10-22","ids":{"openalex":"https://openalex.org/W4416798816","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11249233"},"language":null,"primary_location":{"id":"doi:10.1109/apsipaasc65261.2025.11249233","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11249233","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100764456","display_name":"Yan Huang","orcid":"https://orcid.org/0000-0002-0575-0156"},"institutions":[{"id":"https://openalex.org/I11662577","display_name":"Monash University Malaysia","ror":"https://ror.org/00yncr324","country_code":"MY","type":"education","lineage":["https://openalex.org/I11662577"]}],"countries":["MY"],"is_corresponding":true,"raw_author_name":"YaYa Huang","raw_affiliation_strings":["Monash University Malaysia,Malaysia"],"affiliations":[{"raw_affiliation_string":"Monash University Malaysia,Malaysia","institution_ids":["https://openalex.org/I11662577"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071556259","display_name":"Lingchun Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I11662577","display_name":"Monash University Malaysia","ror":"https://ror.org/00yncr324","country_code":"MY","type":"education","lineage":["https://openalex.org/I11662577"]}],"countries":["MY"],"is_corresponding":false,"raw_author_name":"LiTong Liu","raw_affiliation_strings":["Monash University Malaysia,Malaysia"],"affiliations":[{"raw_affiliation_string":"Monash University Malaysia,Malaysia","institution_ids":["https://openalex.org/I11662577"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069916756","display_name":"KokSheik Wong","orcid":"https://orcid.org/0000-0002-4893-2291"},"institutions":[{"id":"https://openalex.org/I11662577","display_name":"Monash University Malaysia","ror":"https://ror.org/00yncr324","country_code":"MY","type":"education","lineage":["https://openalex.org/I11662577"]}],"countries":["MY"],"is_corresponding":false,"raw_author_name":"KokSheik Wong","raw_affiliation_strings":["Monash University Malaysia,Malaysia"],"affiliations":[{"raw_affiliation_string":"Monash University Malaysia,Malaysia","institution_ids":["https://openalex.org/I11662577"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100764456"],"corresponding_institution_ids":["https://openalex.org/I11662577"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.40641722,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1958","last_page":"1963"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9891999959945679,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9891999959945679,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.00570000009611249,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.0003000000142492354,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.5774999856948853},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.45890000462532043},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.444599986076355},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42320001125335693},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.38350000977516174},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.3684999942779541},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.35269999504089355},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.3483999967575073},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3434000015258789}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6922000050544739},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6395999789237976},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.5774999856948853},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4699999988079071},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.45890000462532043},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.444599986076355},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42320001125335693},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.38350000977516174},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.3684999942779541},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.35269999504089355},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.3483999967575073},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3434000015258789},{"id":"https://openalex.org/C2776429412","wikidata":"https://www.wikidata.org/wiki/Q4688011","display_name":"Aerial image","level":3,"score":0.34310001134872437},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3357999920845032},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.3140000104904175},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2815999984741211},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.2712000012397766},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.2676999866962433},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2669999897480011},{"id":"https://openalex.org/C2781140086","wikidata":"https://www.wikidata.org/wiki/Q557945","display_name":"Confusion","level":2,"score":0.26089999079704285},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2606000006198883},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2572000026702881},{"id":"https://openalex.org/C141379421","wikidata":"https://www.wikidata.org/wiki/Q6094427","display_name":"Iterative reconstruction","level":2,"score":0.2572000026702881},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.2540000081062317},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.2533000111579895},{"id":"https://openalex.org/C32022120","wikidata":"https://www.wikidata.org/wiki/Q797225","display_name":"Interference (communication)","level":3,"score":0.25040000677108765}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipaasc65261.2025.11249233","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11249233","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W2103559027","https://openalex.org/W2128254161","https://openalex.org/W2209874411","https://openalex.org/W2466666260","https://openalex.org/W2559264300","https://openalex.org/W2617393214","https://openalex.org/W2740982616","https://openalex.org/W2912435603","https://openalex.org/W2930755307","https://openalex.org/W2964212750","https://openalex.org/W2965669158","https://openalex.org/W3028045870","https://openalex.org/W3035250394","https://openalex.org/W3035326127","https://openalex.org/W3138516171","https://openalex.org/W3170697543","https://openalex.org/W3174756006","https://openalex.org/W3207918547","https://openalex.org/W4225672218","https://openalex.org/W4230654051","https://openalex.org/W4283023197","https://openalex.org/W4312812783","https://openalex.org/W4385245566","https://openalex.org/W4386075800","https://openalex.org/W4389519244"],"related_works":[],"abstract_inverted_index":{"Rain":[0],"removal":[1],"remains":[2],"a":[3,36,60,67,72,76,84,126,168],"challenging":[4],"task":[5],"in":[6,27,186],"computer":[7],"vision":[8],"due":[9],"to":[10,113,133],"the":[11,90,101,111,181],"complex":[12,162],"interference":[13],"of":[14,38,93],"rain":[15,43,94,123,163],"streaks":[16],"with":[17,71],"background":[18],"structures.":[19],"While":[20],"Transformer-based":[21,177],"methods":[22],"have":[23,32],"shown":[24],"promising":[25],"performances":[26],"modeling":[28],"long-range":[29],"dependencies,":[30],"they":[31],"drawbacks":[33],"such":[34],"as":[35,48,50],"lack":[37],"prior":[39],"guidance,":[40],"confusion":[41],"between":[42],"textures":[44,136],"and":[45,137,150,189],"scene":[46,119],"semantics,":[47],"well":[49],"insufficient":[51],"cross-scale":[52],"consistency.":[53],"To":[54],"address":[55],"these":[56],"limitations,":[57],"we":[58],"propose":[59],"novel":[61],"image":[62,178,187],"de-raining":[63],"framework":[64,166],"that":[65,88,144],"integrates":[66],"Variational":[68],"Autoencoder":[69],"(VAE)":[70],"Transformer":[73,102],"backbone":[74],"via":[75],"Latent-Guided":[77],"Attention":[78],"(LGA)":[79],"mechanism.":[80],"The":[81],"VAE":[82],"learns":[83],"global":[85],"latent":[86,173],"representation":[87],"captures":[89],"statistical":[91],"structure":[92],"patterns,":[95],"which":[96],"is":[97,131],"then":[98],"injected":[99],"into":[100],"at":[103],"multiple":[104],"levels":[105],"through":[106],"cross-attention":[107],"modules.":[108],"This":[109],"enables":[110],"network":[112],"focus":[114],"more":[115],"effectively":[116],"on":[117,153,171],"essential":[118],"features":[120],"while":[121,157],"suppressing":[122],"artifacts.":[124],"Furthermore,":[125],"hierarchical":[127],"feature":[128],"integration":[129],"strategy":[130],"adopted":[132],"fuse":[134],"low-level":[135],"high-level":[138],"semantics":[139],"across":[140],"scales.":[141],"Experiments":[142],"demonstrate":[143],"our":[145],"method":[146],"achieves":[147],"superior":[148],"PSNR":[149],"SSIM":[151],"scores":[152],"standard":[154],"benchmark":[155],"datasets,":[156],"maintaining":[158],"robust":[159],"performance":[160],"under":[161],"conditions.":[164],"Our":[165],"offers":[167],"new":[169],"perspective":[170],"leveraging":[172],"priors":[174],"for":[175,183],"enhancing":[176],"restoration,":[179],"paving":[180],"way":[182],"future":[184],"applications":[185],"de-weathering":[188],"denoising.":[190]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-28T00:00:00"}
