{"id":"https://openalex.org/W7134962790","doi":"https://doi.org/10.48550/arxiv.2603.09138","title":"Rotation Equivariant Mamba for Vision Tasks","display_name":"Rotation Equivariant Mamba for Vision Tasks","publication_year":2026,"publication_date":"2026-03-10","ids":{"openalex":"https://openalex.org/W7134962790","doi":"https://doi.org/10.48550/arxiv.2603.09138"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.09138","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09138","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.09138","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027944715","display_name":"Zhongchen Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Zhongchen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128781252","display_name":"Qi Xie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xie, Qi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090709230","display_name":"Keyu Huang","orcid":"https://orcid.org/0009-0005-2528-1560"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Keyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128742512","display_name":"Lei Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Lei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027430892","display_name":"Deyu Meng","orcid":"https://orcid.org/0009-0001-8923-8167"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Meng, Deyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128706391","display_name":"Zongben Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Zongben","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.45159998536109924,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.45159998536109924,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.12720000743865967,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.06589999794960022,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/equivariant-map","display_name":"Equivariant map","score":0.7954000234603882},{"id":"https://openalex.org/keywords/rotation","display_name":"Rotation (mathematics)","score":0.659600019454956},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6586999893188477},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.38190001249313354},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3000999987125397},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.29350000619888306}],"concepts":[{"id":"https://openalex.org/C171036898","wikidata":"https://www.wikidata.org/wiki/Q256355","display_name":"Equivariant map","level":2,"score":0.7954000234603882},{"id":"https://openalex.org/C74050887","wikidata":"https://www.wikidata.org/wiki/Q848368","display_name":"Rotation (mathematics)","level":2,"score":0.659600019454956},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6586999893188477},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5471000075340271},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5117999911308289},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4745999872684479},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.43529999256134033},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.38190001249313354},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3000999987125397},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.29350000619888306},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.289000004529953},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.2863999903202057},{"id":"https://openalex.org/C68867621","wikidata":"https://www.wikidata.org/wiki/Q257360","display_name":"Mental rotation","level":3,"score":0.2736999988555908},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.26829999685287476},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2678999900817871},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.2563999891281128},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.25270000100135803},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.25110000371932983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.09138","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09138","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.09138","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09138","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Rotation":[0],"equivariance":[1,130,140,191],"constitutes":[2],"one":[3],"of":[4,28,106,127,198],"the":[5,26,93,128,134,142,196],"most":[6],"general":[7],"and":[8,34,67,80,116,157,169],"crucial":[9],"structural":[10],"priors":[11],"for":[12,48,100],"visual":[13,42,97,199],"data,":[14],"yet":[15],"it":[16],"remains":[17],"notably":[18],"absent":[19],"from":[20],"current":[21],"Mamba-based":[22,87],"vision":[23,101],"architectures.":[24,88],"Despite":[25],"success":[27],"Mamba":[29,43,98,118,200],"in":[30,38,51,84],"natural":[31],"language":[32],"processing":[33],"its":[35],"growing":[36],"adoption":[37],"computer":[39],"vision,":[40],"existing":[41],"models":[44,201],"fail":[45],"to":[46,60,176],"account":[47],"rotational":[49],"symmetry":[50],"their":[52,65],"design.":[53],"This":[54],"omission":[55],"renders":[56],"them":[57],"inherently":[58],"sensitive":[59],"image":[61,152,159],"rotations,":[62],"thereby":[63],"constraining":[64],"robustness":[66,168,197],"cross-task":[68],"generalization.":[69],"To":[70],"address":[71],"this":[72],"limitation,":[73],"we":[74,90,121],"incorporate":[75],"rotation":[76,95,112,139,167,190,203],"symmetry,":[77],"a":[78,109,123],"universal":[79],"fundamental":[81],"geometric":[82],"prior":[83],"images,":[85],"into":[86],"Specifically,":[89],"introduce":[91],"EQ-VMamba,":[92],"first":[94],"equivariant":[96,113],"architecture":[99,136],"tasks.":[102],"The":[103],"core":[104],"components":[105],"EQ-VMamba":[107,164],"include":[108],"carefully":[110],"designed":[111],"cross-scan":[114],"strategy":[115],"group":[117],"blocks.":[119],"Moreover,":[120],"provide":[122],"rigorous":[124],"theoretical":[125],"analysis":[126],"intrinsic":[129],"error,":[131],"demonstrating":[132],"that":[133,163,188],"proposed":[135],"enforces":[137],"end-to-end":[138],"throughout":[141],"network.":[143],"Extensive":[144],"experiments":[145],"across":[146],"multiple":[147],"benchmarks":[148],"--":[149,161],"including":[150],"high-level":[151],"classification,":[153],"mid-level":[154],"semantic":[155],"segmentation,":[156],"low-level":[158],"super-resolution":[160],"demonstrate":[162],"consistently":[165],"improves":[166],"achieves":[170],"superior":[171],"or":[172],"competitive":[173],"performance":[174,209],"compared":[175],"non-equivariant":[177],"baselines,":[178],"while":[179],"requiring":[180],"approximately":[181],"50\\%":[182],"fewer":[183],"parameters.":[184],"These":[185],"results":[186],"indicate":[187],"embedding":[189],"not":[192],"only":[193],"effectively":[194],"bolsters":[195],"against":[202],"transformations,":[204],"but":[205],"also":[206],"enhances":[207],"overall":[208],"with":[210],"significantly":[211],"improved":[212],"parameter":[213],"efficiency.":[214],"Code":[215],"is":[216],"available":[217],"at":[218],"https://github.com/zhongchenzhao/EQ-VMamba.":[219]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-12T00:00:00"}
