{"id":"https://openalex.org/W7148540370","doi":"https://doi.org/10.48550/arxiv.2604.00360","title":"VADMamba++: Efficient Video Anomaly Detection via Hybrid Modeling in Grayscale Space","display_name":"VADMamba++: Efficient Video Anomaly Detection via Hybrid Modeling in Grayscale Space","publication_year":2026,"publication_date":"2026-04-01","ids":{"openalex":"https://openalex.org/W7148540370","doi":"https://doi.org/10.48550/arxiv.2604.00360"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.00360","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00360","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.00360","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132815181","display_name":"Jihao Lyu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lyu, Jihao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132806114","display_name":"Minghua Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Minghua","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132789087","display_name":"Jing Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Jing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132803655","display_name":"Yifei Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yifei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132810875","display_name":"Shuangli Du","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Shuangli","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132823862","display_name":"Cheng Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Cheng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5132815181"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.984499990940094,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.984499990940094,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.0066999997943639755,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.0010000000474974513,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/grayscale","display_name":"Grayscale","score":0.660099983215332},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.6057000160217285},{"id":"https://openalex.org/keywords/color-space","display_name":"Color space","score":0.5084999799728394},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5073999762535095},{"id":"https://openalex.org/keywords/chromatic-scale","display_name":"Chromatic scale","score":0.4927999973297119},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.45579999685287476},{"id":"https://openalex.org/keywords/anomaly-detection","display_name":"Anomaly detection","score":0.4262000024318695},{"id":"https://openalex.org/keywords/optical-flow","display_name":"Optical flow","score":0.4244000017642975}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7502999901771545},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7475000023841858},{"id":"https://openalex.org/C78201319","wikidata":"https://www.wikidata.org/wiki/Q685727","display_name":"Grayscale","level":3,"score":0.660099983215332},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.6057000160217285},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5432000160217285},{"id":"https://openalex.org/C2961294","wikidata":"https://www.wikidata.org/wiki/Q166863","display_name":"Color space","level":3,"score":0.5084999799728394},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5073999762535095},{"id":"https://openalex.org/C196956537","wikidata":"https://www.wikidata.org/wiki/Q202021","display_name":"Chromatic scale","level":2,"score":0.4927999973297119},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.45579999685287476},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.4262000024318695},{"id":"https://openalex.org/C155542232","wikidata":"https://www.wikidata.org/wiki/Q736111","display_name":"Optical flow","level":3,"score":0.4244000017642975},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.336899995803833},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.3352999985218048},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.32030001282691956},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.30799999833106995},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.30570000410079956},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2851000130176544},{"id":"https://openalex.org/C21200559","wikidata":"https://www.wikidata.org/wiki/Q7451068","display_name":"Sensitivity (control systems)","level":2,"score":0.2759999930858612},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2720000147819519},{"id":"https://openalex.org/C2776449333","wikidata":"https://www.wikidata.org/wiki/Q7928781","display_name":"View synthesis","level":3,"score":0.2549999952316284}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.00360","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00360","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.00360","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00360","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.6676628589630127,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"VADMamba":[0],"pioneered":[1],"the":[2,55,107,146],"introduction":[3],"of":[4,148],"Mamba":[5],"to":[6,38,62,88,110,121,139],"Video":[7],"Anomaly":[8],"Detection":[9],"(VAD),":[10],"achieving":[11],"high":[12],"accuracy":[13,168],"and":[14,31,72,98,115,136,189],"fast":[15],"inference":[16],"through":[17,93],"hybrid":[18,129],"proxy":[19,41,70],"tasks.":[20],"Nevertheless,":[21],"its":[22,36],"heavy":[23],"reliance":[24],"on":[25,54,176],"optical":[26],"flow":[27],"as":[28],"auxiliary":[29,75],"input":[30],"inter-task":[32],"fusion":[33,153],"scoring":[34,154],"constrains":[35],"applicability":[37],"a":[39,60,68,128,170,193],"single":[40,69,171],"task.":[42],"In":[43],"this":[44],"paper,":[45],"we":[46],"introduce":[47],"VADMamba++,":[48],"an":[49,151],"efficient":[50],"VAD":[51],"method":[52],"based":[53],"Gray-to-RGB":[56],"paradigm":[57,78],"that":[58,132,181],"enforces":[59],"Single-Channel":[61],"Three-Channel":[63],"reconstruction":[64],"mapping,":[65],"designed":[66],"for":[67],"task":[71,172],"operating":[73],"without":[74],"inputs.":[76,200],"This":[77],"compels":[79],"inferring":[80],"color":[81],"appearances":[82],"from":[83],"grayscale":[84,104],"structures,":[85],"allowing":[86],"anomalies":[87],"be":[89],"more":[90],"effectively":[91],"revealed":[92],"dual":[94],"inconsistencies":[95],"between":[96],"structure":[97],"chromatic":[99,116],"cues.":[100],"Specifically,":[101],"VADMamba++":[102,182],"reconstructs":[103],"frames":[105],"into":[106],"RGB":[108],"space":[109],"simultaneously":[111],"discriminate":[112],"structural":[113],"geometry":[114],"fidelity,":[117],"thereby":[118],"enhancing":[119],"sensitivity":[120],"explicit":[122,157],"visual":[123],"anomalies.":[124,149],"We":[125],"further":[126,166],"design":[127],"modeling":[130],"backbone":[131],"integrates":[133,156],"Mamba,":[134],"CNN,":[135],"Transformer":[137],"modules":[138],"capture":[140],"diverse":[141],"normal":[142],"patterns":[143],"while":[144,186],"suppressing":[145],"appearance":[147],"Furthermore,":[150],"intra-task":[152],"strategy":[155],"future-frame":[158],"prediction":[159],"errors":[160],"with":[161,197],"implicit":[162],"quantized":[163],"feature":[164],"errors,":[165],"improving":[167],"under":[169,192],"setting.":[173],"Extensive":[174],"experiments":[175],"three":[177],"benchmark":[178],"datasets":[179],"demonstrate":[180],"outperforms":[183],"state-of-the-art":[184],"methods":[185],"meeting":[187],"performance":[188],"efficiency,":[190],"especially":[191],"strict":[194],"single-task":[195],"setting":[196],"only":[198],"frame-level":[199]},"counts_by_year":[],"updated_date":"2026-04-03T16:44:17.987007","created_date":"2026-04-03T00:00:00"}
