{"id":"https://openalex.org/W7129660942","doi":"https://doi.org/10.48550/arxiv.2602.13301","title":"DriveMamba: Task-Centric Scalable State Space Model for Efficient End-to-End Autonomous Driving","display_name":"DriveMamba: Task-Centric Scalable State Space Model for Efficient End-to-End Autonomous Driving","publication_year":2026,"publication_date":"2026-02-09","ids":{"openalex":"https://openalex.org/W7129660942","doi":"https://doi.org/10.48550/arxiv.2602.13301"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.13301","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126242280","display_name":"Haisheng Su","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Haisheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126219960","display_name":"Wei Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085957296","display_name":"Feixiang Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Feixiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126218830","display_name":"Junjie Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Junjie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101944161","display_name":"Zhenjie Yang","orcid":"https://orcid.org/0000-0002-2570-1167"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Zhenjie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126202108","display_name":"Junchi Yan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Junchi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.8726000189781189,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.8726000189781189,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.027899999171495438,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.014499999582767487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.670199990272522},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.6656000018119812},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.5853999853134155},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5501999855041504},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4542999863624573},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.4523000121116638},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.43230000138282776},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.3628999888896942},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.3382999897003174},{"id":"https://openalex.org/keywords/modularity","display_name":"Modularity (biology)","score":0.3328999876976013}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.781000018119812},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.670199990272522},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.6656000018119812},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.5853999853134155},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5501999855041504},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.548799991607666},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4542999863624573},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.4523000121116638},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.43230000138282776},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.3628999888896942},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3393999934196472},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.3382999897003174},{"id":"https://openalex.org/C2779478453","wikidata":"https://www.wikidata.org/wiki/Q6889748","display_name":"Modularity (biology)","level":2,"score":0.3328999876976013},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.3296999931335449},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.32330000400543213},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3199000060558319},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3075000047683716},{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.30709999799728394},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.30559998750686646},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.30090001225471497},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.299699991941452},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2879999876022339},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.28299999237060547},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.2791999876499176},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.27730000019073486},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.27219998836517334},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.27079999446868896},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.27000001072883606},{"id":"https://openalex.org/C2776221188","wikidata":"https://www.wikidata.org/wiki/Q21072556","display_name":"Design space exploration","level":2,"score":0.2628999948501587},{"id":"https://openalex.org/C28006648","wikidata":"https://www.wikidata.org/wiki/Q6934509","display_name":"Multi-task learning","level":3,"score":0.259799987077713},{"id":"https://openalex.org/C190502265","wikidata":"https://www.wikidata.org/wiki/Q17069496","display_name":"MNIST database","level":3,"score":0.257099986076355},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.2524999976158142},{"id":"https://openalex.org/C96146094","wikidata":"https://www.wikidata.org/wiki/Q609057","display_name":"Unification","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.13301","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.13301","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.13301","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.13301","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"advances":[1],"towards":[2],"End-to-End":[3],"Autonomous":[4],"Driving":[5],"(E2E-AD)":[6],"have":[7],"been":[8],"often":[9],"devoted":[10],"on":[11,32,38,191],"integrating":[12],"modular":[13],"designs":[14],"into":[15,121,138],"a":[16,26,100,122,170],"unified":[17],"framework":[18],"for":[19,104],"joint":[20],"optimization":[21],"e.g.":[22],"UniAD,":[23],"which":[24,107,144],"follow":[25],"sequential":[27,161],"paradigm":[28,103],"(i.e.,":[29],"perception-prediction-planning)":[30],"based":[31],"separable":[33],"Transformer":[34],"decoders":[35],"and":[36,56,61,68,76,85,117,132,193,200],"rely":[37],"dense":[39],"BEV":[40],"features":[41,131],"to":[42,90,164,178],"encode":[43],"scene":[44],"representations.":[45],"However,":[46],"such":[47],"manual":[48],"ordering":[49],"design":[50],"can":[51],"inevitably":[52],"cause":[53],"information":[54],"loss":[55],"cumulative":[57],"errors,":[58],"lacking":[59],"flexible":[60],"diverse":[62],"relation":[63,111],"modeling":[64,163],"among":[65],"different":[66],"modules":[67],"sensors.":[69],"Meanwhile,":[70],"insufficient":[71],"training":[72],"of":[73,78,87,203],"image":[74,130],"backbone":[75],"quadratic-complexity":[77],"attention":[79],"mechanism":[80],"also":[81],"hinder":[82],"the":[83,186,197],"scalability":[84],"efficiency":[86,202],"E2E-AD":[88],"system":[89],"handle":[91],"spatiotemporal":[92],"input.":[93],"To":[94],"this":[95],"end,":[96],"we":[97],"propose":[98],"DriveMamba,":[99],"Task-Centric":[101],"Scalable":[102],"efficient":[105,159],"E2E-AD,":[106],"integrates":[108],"dynamic":[109],"task":[110,134],"modeling,":[112],"implicit":[113],"view":[114],"correspondence":[115],"learning":[116],"long-term":[118],"temporal":[119],"fusion":[120],"single-stage":[123],"Unified":[124],"Mamba":[125],"decoder.":[126],"Specifically,":[127],"both":[128],"extracted":[129],"expected":[133],"outputs":[135],"are":[136,145],"converted":[137],"token-level":[139],"sparse":[140],"representations":[141],"in":[142,152],"advance,":[143],"then":[146],"sorted":[147],"by":[148],"their":[149],"instantiated":[150],"positions":[151],"3D":[153],"space.":[154],"The":[155],"linear-complexity":[156],"operator":[157],"enables":[158],"long-context":[160],"token":[162],"capture":[165],"task-related":[166],"inter-dependencies":[167],"simultaneously.":[168],"Additionally,":[169],"bidirectional":[171],"trajectory-guided":[172],"\"local-to-global\"":[173],"scan":[174],"method":[175],"is":[176],"designed":[177],"preserve":[179],"spatial":[180],"locality":[181],"from":[182],"ego-perspective,":[183],"thus":[184],"facilitating":[185],"ego-planning.":[187],"Extensive":[188],"experiments":[189],"conducted":[190],"nuScenes":[192],"Bench2Drive":[194],"datasets":[195],"demonstrate":[196],"superiority,":[198],"generalizability":[199],"great":[201],"DriveMamba.":[204]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-18T00:00:00"}
