{"id":"https://openalex.org/W4392974062","doi":"https://doi.org/10.48550/arxiv.2403.11423","title":"VmambaIR: Visual State Space Model for Image Restoration","display_name":"VmambaIR: Visual State Space Model for Image Restoration","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392974062","doi":"https://doi.org/10.48550/arxiv.2403.11423"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2403.11423","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.11423","pdf_url":"https://arxiv.org/pdf/2403.11423","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2403.11423","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100629589","display_name":"Yuan Shi","orcid":"https://orcid.org/0000-0002-6150-7513"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Shi, Yuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100751857","display_name":"Bin Xia","orcid":"https://orcid.org/0000-0002-5583-3275"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xia, Bin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040683618","display_name":"Xiaoyu Jin","orcid":"https://orcid.org/0000-0003-3024-7437"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Xiaoyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100754894","display_name":"Xing Wang","orcid":"https://orcid.org/0000-0002-7176-7036"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Xing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048297544","display_name":"Tianyu Zhao","orcid":"https://orcid.org/0000-0003-2401-4098"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Tianyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006669765","display_name":"Xin Xia","orcid":"https://orcid.org/0000-0002-6302-3256"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xia, Xin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101051966","display_name":"Xuefeng Xiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Xuefeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5026184280","display_name":"Wenming Yang","orcid":"https://orcid.org/0000-0002-2506-1286"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Wenming","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5100629589"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.9775000214576721,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.9775000214576721,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9664000272750854,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9593999981880188,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.6243897080421448},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.5348946452140808},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5322670340538025},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5192989706993103},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.4871461093425751},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.4646875858306885},{"id":"https://openalex.org/keywords/image-restoration","display_name":"Image restoration","score":0.44495218992233276},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.436125248670578},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.3304551839828491},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.17727196216583252},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.16339904069900513},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.0657794177532196}],"concepts":[{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.6243897080421448},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.5348946452140808},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5322670340538025},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5192989706993103},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.4871461093425751},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.4646875858306885},{"id":"https://openalex.org/C106430172","wikidata":"https://www.wikidata.org/wiki/Q6002272","display_name":"Image restoration","level":4,"score":0.44495218992233276},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.436125248670578},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.3304551839828491},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.17727196216583252},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.16339904069900513},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0657794177532196}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2403.11423","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.11423","pdf_url":"https://arxiv.org/pdf/2403.11423","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2403.11423","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2403.11423","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2403.11423","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.11423","pdf_url":"https://arxiv.org/pdf/2403.11423","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4392974062.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2357322570","https://openalex.org/W90581812","https://openalex.org/W2997591215","https://openalex.org/W2227541280","https://openalex.org/W2029783634","https://openalex.org/W2979181971","https://openalex.org/W2888591766","https://openalex.org/W2808332603","https://openalex.org/W2365681766","https://openalex.org/W2393963626"],"abstract_inverted_index":{"Image":[0],"restoration":[1,98,160],"is":[2],"a":[3,102,151],"critical":[4],"task":[5],"in":[6,49,144,209],"low-level":[7,216],"computer":[8],"vision,":[9],"aiming":[10],"to":[11,38,72,105,203],"restore":[12],"high-quality":[13],"images":[14],"from":[15],"degraded":[16],"inputs.":[17],"Various":[18],"models,":[19],"such":[20],"as":[21,200,211],"convolutional":[22],"neural":[23],"networks":[24,28],"(CNNs),":[25],"generative":[26],"adversarial":[27],"(GANs),":[29],"transformers,":[30],"and":[31,58,119,168,189,206],"diffusion":[32],"models":[33,57,199],"(DMs),":[34],"have":[35,47,64],"been":[36],"employed":[37],"address":[39,80],"this":[40],"problem":[41],"with":[42,75,92,184],"significant":[43],"impact.":[44],"However,":[45],"CNNs":[46],"limitations":[48],"capturing":[50],"long-range":[51],"dependencies.":[52],"DMs":[53],"require":[54],"large":[55],"prior":[56],"computationally":[59],"intensive":[60],"denoising":[61],"steps.":[62],"Transformers":[63],"powerful":[65],"modeling":[66,134,140],"capabilities":[67],"but":[68],"face":[69],"challenges":[70],"due":[71],"quadratic":[73],"complexity":[74,94],"input":[76],"image":[77,97,141,159,163,166,170],"size.":[78],"To":[79],"these":[81],"challenges,":[82],"we":[83,149],"propose":[84],"VmambaIR,":[85],"which":[86],"introduces":[87],"State":[88],"Space":[89],"Models":[90],"(SSMs)":[91],"linear":[93],"into":[95],"comprehensive":[96,152],"tasks.":[99,218],"We":[100],"utilize":[101],"Unet":[103],"architecture":[104],"stack":[106],"our":[107,155,177],"proposed":[108,126,178],"Omni":[109],"Selective":[110],"Scan":[111],"(OSS)":[112],"blocks,":[113],"consisting":[114],"of":[115,136,154,196],"an":[116,120],"OSS":[117],"module":[118],"Efficient":[121],"Feed-Forward":[122],"Network":[123],"(EFFN).":[124],"Our":[125,191],"omni":[127],"selective":[128],"scan":[129],"mechanism":[130],"overcomes":[131],"the":[132,194,204],"unidirectional":[133],"limitation":[135],"SSMs":[137],"by":[138],"efficiently":[139],"information":[142],"flows":[143],"all":[145],"six":[146],"directions.":[147],"Furthermore,":[148],"conducted":[150],"evaluation":[153],"VmambaIR":[156,179],"across":[157],"multiple":[158],"tasks,":[161],"including":[162],"deraining,":[164],"single":[165],"super-resolution,":[167],"real-world":[169],"super-resolution.":[171],"Extensive":[172],"experimental":[173],"results":[174],"demonstrate":[175],"that":[176],"achieves":[180],"state-of-the-art":[181],"(SOTA)":[182],"performance":[183],"much":[185],"fewer":[186],"computational":[187],"resources":[188],"parameters.":[190],"research":[192],"highlights":[193],"potential":[195],"state":[197],"space":[198],"promising":[201],"alternatives":[202],"transformer":[205],"CNN":[207],"architectures":[208],"serving":[210],"foundational":[212],"frameworks":[213],"for":[214],"next-generation":[215],"visual":[217]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":6}],"updated_date":"2026-03-11T14:59:36.786465","created_date":"2025-10-10T00:00:00"}
