{"id":"https://openalex.org/W7146978012","doi":"https://doi.org/10.1109/icvisp68610.2025.11451679","title":"Multi-Path Residual Attention Backbone With Dynamic Normalization Transformer Decoder For Semantic Segmentation","display_name":"Multi-Path Residual Attention Backbone With Dynamic Normalization Transformer Decoder For Semantic Segmentation","publication_year":2025,"publication_date":"2025-11-28","ids":{"openalex":"https://openalex.org/W7146978012","doi":"https://doi.org/10.1109/icvisp68610.2025.11451679"},"language":null,"primary_location":{"id":"doi:10.1109/icvisp68610.2025.11451679","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icvisp68610.2025.11451679","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 9th International Conference on Vision, Image and Signal Processing (ICVISP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132569115","display_name":"Kefan Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I102345215","display_name":"Xihua University","ror":"https://ror.org/04gwtvf26","country_code":"CN","type":"education","lineage":["https://openalex.org/I102345215"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Kefan Zhu","raw_affiliation_strings":["Xihua University,School of Computer and Software Engineering,Chengdu,China"],"affiliations":[{"raw_affiliation_string":"Xihua University,School of Computer and Software Engineering,Chengdu,China","institution_ids":["https://openalex.org/I102345215"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132549899","display_name":"Zhaoyan Li","orcid":null},"institutions":[{"id":"https://openalex.org/I102345215","display_name":"Xihua University","ror":"https://ror.org/04gwtvf26","country_code":"CN","type":"education","lineage":["https://openalex.org/I102345215"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhaoyan Li","raw_affiliation_strings":["Xihua University,School of Computer and Software Engineering,Chengdu,China"],"affiliations":[{"raw_affiliation_string":"Xihua University,School of Computer and Software Engineering,Chengdu,China","institution_ids":["https://openalex.org/I102345215"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5132604754","display_name":"Zhisheng Gao","orcid":null},"institutions":[{"id":"https://openalex.org/I102345215","display_name":"Xihua University","ror":"https://ror.org/04gwtvf26","country_code":"CN","type":"education","lineage":["https://openalex.org/I102345215"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhisheng Gao","raw_affiliation_strings":["Xihua University,School of Computer and Software Engineering,Chengdu,China"],"affiliations":[{"raw_affiliation_string":"Xihua University,School of Computer and Software Engineering,Chengdu,China","institution_ids":["https://openalex.org/I102345215"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5132569115"],"corresponding_institution_ids":["https://openalex.org/I102345215"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.75248058,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.4108999967575073,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.4108999967575073,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.18860000371932983,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.06469999998807907,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.5877000093460083},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5720999836921692},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5317000150680542},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.4934000074863434},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4724999964237213},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.47200000286102295},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.43650001287460327},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.3774000108242035}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8048999905586243},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6956999897956848},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.5877000093460083},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5720999836921692},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5317000150680542},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.4934000074863434},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4724999964237213},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.47200000286102295},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.43650001287460327},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4059999883174896},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3774000108242035},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.37720000743865967},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3747999966144562},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.335099995136261},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.28200000524520874},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.2786000072956085},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.2750999927520752},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.27000001072883606},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.2696000039577484},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.2694999873638153},{"id":"https://openalex.org/C55020928","wikidata":"https://www.wikidata.org/wiki/Q3813865","display_name":"Image quality","level":3,"score":0.2685000002384186},{"id":"https://openalex.org/C74296488","wikidata":"https://www.wikidata.org/wiki/Q2527392","display_name":"End-to-end principle","level":2,"score":0.26260000467300415},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.26190000772476196}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icvisp68610.2025.11451679","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icvisp68610.2025.11451679","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 9th International Conference on Vision, Image and Signal Processing (ICVISP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/15","score":0.4512227475643158,"display_name":"Life in Land"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W1903029394","https://openalex.org/W2560023338","https://openalex.org/W2964309882","https://openalex.org/W3096609285","https://openalex.org/W3132455321","https://openalex.org/W4312815172","https://openalex.org/W4385391093","https://openalex.org/W4393159321","https://openalex.org/W4401070841","https://openalex.org/W4402715864","https://openalex.org/W4402733565"],"related_works":[],"abstract_inverted_index":{"Transformer":[0],"is":[1,93],"considered":[2],"to":[3,47,103,189],"be":[4],"very":[5],"powerful":[6],"for":[7,198],"basic":[8],"image":[9,32,49,120,133,183],"processing":[10],"tasks,":[11],"and":[12,38,57,62,73,100,107,112,132,139,147,172,217,227,234],"its":[13,173],"performance":[14],"has":[15],"been":[16],"verified":[17],"on":[18,55],"some":[19],"standard":[20],"datasets.":[21],"However,":[22],"in":[23,40,79,175,219,241],"actual":[24],"engineering":[25,59],"application":[26,60],"scenarios,":[27],"dynamic":[28,81,176],"environmental":[29],"changes,":[30],"inconsistent":[31,34],"quality,":[33],"target":[35],"size,":[36],"category":[37],"number":[39],"the":[41,48,71,77,84,142,145,167,192,232,238],"image,":[42],"etc.,":[43],"will":[44],"bring":[45],"challenges":[46],"semantic":[50,66,195],"segmentation":[51,67,196],"model.This":[52],"paper":[53,151],"focuses":[54],"specific":[56],"real":[58],"problems":[61],"proposes":[63,152],"a":[64,180],"robust":[65],"model,":[68],"which":[69],"improves":[70,166],"adaptability":[72,174],"generalization":[74,218],"ability":[75],"of":[76,169,237],"model":[78,125,170,197],"complex":[80,220],"environments.":[82],"During":[83],"feature":[85,105,110],"extraction":[86,106],"phase,":[87,149],"multi-path":[88,97],"residual":[89],"attention":[90,102],"backbone":[91],"network":[92],"proposed.":[94],"It":[95],"uses":[96],"convolutional":[98],"residuals":[99],"channel-wise":[101],"guide":[104],"fusion,":[108],"enhancing":[109],"representation":[111],"local":[113],"context":[114],"modeling":[115],"capabilities":[116],"while":[117],"enabling":[118],"fine-grained":[119],"structure":[121],"perception.":[122],"The":[123],"designed":[124],"can":[126],"better":[127],"handle":[128],"object":[129],"scale":[130,223],"variations":[131],"quality":[134],"differences":[135],"such":[136],"as":[137],"blur":[138],"jitter":[140],"within":[141],"scene.":[143],"In":[144],"decoding":[146],"reconstruction":[148],"this":[150,187],"replacing":[153],"traditional":[154],"Layer":[155],"Normalization":[156],"with":[157,222],"Dynamic":[158],"Normalization,":[159],"thereby":[160],"implementing":[161],"feature-adaptive":[162],"normalization.":[163],"This":[164,230],"further":[165],"stability":[168],"training":[171],"scenarios.":[177,200],"We":[178,185],"constructed":[179],"real-world,":[181],"robot-perspective":[182],"dataset.":[184],"used":[186],"dataset":[188],"comprehensively":[190],"evaluate":[191],"proposed":[193,239],"MDT":[194,205],"real-world":[199,242],"Experimental":[201],"results":[202],"demonstrate":[203],"that":[204],"outperforms":[206],"baseline":[207],"models":[208],"across":[209],"multiple":[210],"evaluation":[211],"metrics,":[212],"particularly":[213],"demonstrating":[214],"enhanced":[215],"robustness":[216],"environments":[221],"variations,":[224],"motion":[225],"blur,":[226],"illumination":[228],"interference.":[229],"demonstrates":[231],"effectiveness":[233],"practical":[235],"value":[236],"method":[240],"robotics":[243],"applications.":[244]},"counts_by_year":[],"updated_date":"2026-04-02T13:53:19.096889","created_date":"2026-04-02T00:00:00"}
