{"id":"https://openalex.org/W7154623820","doi":"https://doi.org/10.48550/arxiv.2604.13891","title":"Beyond Conservative Automated Driving in Multi-Agent Scenarios via Coupled Model Predictive Control and Deep Reinforcement Learning","display_name":"Beyond Conservative Automated Driving in Multi-Agent Scenarios via Coupled Model Predictive Control and Deep Reinforcement Learning","publication_year":2026,"publication_date":"2026-04-15","ids":{"openalex":"https://openalex.org/W7154623820","doi":"https://doi.org/10.48550/arxiv.2604.13891"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.13891","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.13891","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.13891","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086883629","display_name":"Saeed Rahmani","orcid":"https://orcid.org/0000-0002-2422-7109"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rahmani, Saeed","raw_affiliation_strings":["Gavin"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Gavin","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065153648","display_name":"G\u00f6zde K\u00f6rpe","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"K\u00f6rpe, G\u00f6zde","raw_affiliation_strings":["Gavin"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Gavin","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133792379","display_name":"Zhenlin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhenlin","raw_affiliation_strings":["Gavin"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Gavin","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133804226","display_name":"Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133754213","display_name":"Bruno Brito","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Brito, Bruno","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052655645","display_name":"Simeon C. Calvert","orcid":"https://orcid.org/0000-0002-1173-0071"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Calvert, Simeon Craig","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133779081","display_name":"Bart van Arem","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"van Arem, Bart","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.7540000081062317,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.7540000081062317,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.1264999955892563,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.0348999984562397,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7236999869346619},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6944000124931335},{"id":"https://openalex.org/keywords/model-predictive-control","display_name":"Model predictive control","score":0.6858000159263611},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.6383000016212463},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.534600019454956},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.5328999757766724},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.4341999888420105},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.41029998660087585}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7236999869346619},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.708899974822998},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6944000124931335},{"id":"https://openalex.org/C172205157","wikidata":"https://www.wikidata.org/wiki/Q1782962","display_name":"Model predictive control","level":3,"score":0.6858000159263611},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.6383000016212463},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.534600019454956},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.5328999757766724},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.515999972820282},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.4341999888420105},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.42719998955726624},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.41029998660087585},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.375900000333786},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.36070001125335693},{"id":"https://openalex.org/C168031717","wikidata":"https://www.wikidata.org/wiki/Q1530280","display_name":"Balance (ability)","level":2,"score":0.30809998512268066},{"id":"https://openalex.org/C107464732","wikidata":"https://www.wikidata.org/wiki/Q235781","display_name":"Adaptive control","level":3,"score":0.3005000054836273},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.2703999876976013},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.2703999876976013},{"id":"https://openalex.org/C121704057","wikidata":"https://www.wikidata.org/wiki/Q352070","display_name":"Collision","level":2,"score":0.2685000002384186},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2669000029563904},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2648000121116638},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.2621000111103058},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.2583000063896179}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.13891","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.13891","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.13891","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.13891","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Automated":[0],"driving":[1,191],"at":[2],"unsignalized":[3],"intersections":[4],"is":[5,196],"challenging":[6],"due":[7],"to":[8,15,58,70,107,115],"complex":[9],"multi-vehicle":[10],"interactions":[11],"and":[12,18,56,84,99,174],"the":[13,94,101,133,136,164,169,181],"need":[14],"balance":[16,170],"safety":[17,54,172],"efficiency.":[19],"Model":[20],"Predictive":[21],"Control":[22],"(MPC)":[23],"offers":[24],"structured":[25],"constraint":[26],"handling":[27],"through":[28],"optimization":[29],"but":[30,50],"relies":[31],"on":[32],"hand-crafted":[33],"rules":[34],"that":[35,79,163],"often":[36,51],"produce":[37],"overly":[38],"conservative":[39],"behavior.":[40],"Deep":[41],"Reinforcement":[42],"Learning":[43],"(RL)":[44],"learns":[45],"adaptive":[46],"behaviors":[47],"from":[48],"experience":[49],"struggles":[52],"with":[53],"assurance":[55],"generalization":[57,189],"unseen":[59],"environments.":[60,192],"In":[61],"this":[62],"study,":[63],"we":[64],"present":[65],"an":[66],"integrated":[67,165],"MPC-RL":[68,80,92],"framework":[69,143],"improve":[71,168],"navigation":[72],"performance":[73,173],"in":[74,139,176],"multi-agent":[75,177],"scenarios.":[76],"Experiments":[77],"show":[78],"outperforms":[81],"standalone":[82],"MPC":[83,137,182],"end-to-end":[85,129,150],"RL":[86,151],"across":[87,190],"three":[88],"traffic-density":[89],"levels.":[90],"Collectively,":[91],"reduces":[93],"collision":[95],"rate":[96,103],"by":[97,104],"21%":[98],"improves":[100],"success":[102],"6.5%":[105],"compared":[106],"pure":[108],"MPC.":[109],"We":[110],"further":[111],"evaluate":[112],"zero-shot":[113],"transfer":[114,125],"a":[116,156,185],"highway":[117],"merging":[118],"scenario":[119],"without":[120],"retraining.":[121],"Both":[122],"MPC-based":[123],"methods":[124],"substantially":[126],"better":[127],"than":[128,149],"PPO,":[130],"which":[131,154],"highlights":[132],"role":[134],"of":[135],"backbone":[138],"cross-scenario":[140],"robustness.":[141],"The":[142,193],"also":[144],"shows":[145],"faster":[146],"loss":[147],"stabilization":[148],"during":[152],"training,":[153],"indicates":[155],"reduced":[157],"learning":[158],"burden.":[159],"These":[160],"results":[161],"suggest":[162],"approach":[166],"can":[167],"between":[171],"efficiency":[175],"intersection":[178],"scenarios,":[179],"while":[180],"component":[183],"provides":[184],"strong":[186],"foundation":[187],"for":[188],"implementation":[194],"code":[195],"available":[197],"open-source.":[198]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-17T00:00:00"}
