{"id":"https://openalex.org/W3203076355","doi":"https://doi.org/10.1109/tpami.2022.3190471","title":"MetaDrive: Composing Diverse Driving Scenarios for Generalizable Reinforcement Learning","display_name":"MetaDrive: Composing Diverse Driving Scenarios for Generalizable Reinforcement Learning","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W3203076355","doi":"https://doi.org/10.1109/tpami.2022.3190471","mag":"3203076355","pmid":"https://pubmed.ncbi.nlm.nih.gov/35830412"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2022.3190471","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2022.3190471","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064938053","display_name":"Quanyi Li","orcid":"https://orcid.org/0000-0003-0427-4554"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Quanyi Li","raw_affiliation_strings":["Centre for Perceptual, Interactive Intelligence, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre for Perceptual, Interactive Intelligence, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109521346","display_name":"Zhenghao Peng","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Zhenghao Peng","raw_affiliation_strings":["The Chinese University of Hong Kong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong, China","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Lan Feng","orcid":null},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Lan Feng","raw_affiliation_strings":["ETH Zurich, Switzerland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"ETH Zurich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103254100","display_name":"Qihang Zhang","orcid":"https://orcid.org/0000-0003-1784-8166"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Qihang Zhang","raw_affiliation_strings":["The Chinese University of Hong Kong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong, China","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054607440","display_name":"Zhenghai Xue","orcid":"https://orcid.org/0000-0002-9340-0366"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Zhenghai Xue","raw_affiliation_strings":["The Chinese University of Hong Kong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong, China","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033444412","display_name":"Bolei Zhou","orcid":"https://orcid.org/0000-0003-4030-0684"},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bolei Zhou","raw_affiliation_strings":["University of California, Los Angeles, USA"],"raw_orcid":"https://orcid.org/0000-0003-4030-0684","affiliations":[{"raw_affiliation_string":"University of California, Los Angeles, USA","institution_ids":["https://openalex.org/I161318765"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5064938053"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":14.2696,"has_fulltext":false,"cited_by_count":192,"citation_normalized_percentile":{"value":0.99591853,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":100},"biblio":{"volume":"45","issue":"3","first_page":"1","last_page":"14"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8813856244087219},{"id":"https://openalex.org/keywords/generalizability-theory","display_name":"Generalizability theory","score":0.8764674067497253},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8168010115623474},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7844035625457764},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5994572043418884},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5642077326774597},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.5327503681182861},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4877644181251526},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.48529642820358276},{"id":"https://openalex.org/keywords/intelligent-agent","display_name":"Intelligent agent","score":0.4378302991390228},{"id":"https://openalex.org/keywords/documentation","display_name":"Documentation","score":0.42040809988975525},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3497656583786011}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8813856244087219},{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.8764674067497253},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8168010115623474},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7844035625457764},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5994572043418884},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5642077326774597},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.5327503681182861},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4877644181251526},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.48529642820358276},{"id":"https://openalex.org/C74072328","wikidata":"https://www.wikidata.org/wiki/Q1142726","display_name":"Intelligent agent","level":2,"score":0.4378302991390228},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.42040809988975525},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3497656583786011},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2022.3190471","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2022.3190471","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:35830412","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35830412","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.800000011920929,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":85,"referenced_works":["https://openalex.org/W1191599655","https://openalex.org/W1989750313","https://openalex.org/W2056877664","https://openalex.org/W2150468603","https://openalex.org/W2156256170","https://openalex.org/W2158782408","https://openalex.org/W2257979135","https://openalex.org/W2602275733","https://openalex.org/W2615547864","https://openalex.org/W2616635592","https://openalex.org/W2727840223","https://openalex.org/W2736601468","https://openalex.org/W2748378127","https://openalex.org/W2766413382","https://openalex.org/W2771506457","https://openalex.org/W2895921264","https://openalex.org/W2899076365","https://openalex.org/W2903709398","https://openalex.org/W2923090615","https://openalex.org/W2945991855","https://openalex.org/W2951984055","https://openalex.org/W2955189650","https://openalex.org/W2962803570","https://openalex.org/W2962867954","https://openalex.org/W2963039558","https://openalex.org/W2963094322","https://openalex.org/W2964657419","https://openalex.org/W2968983352","https://openalex.org/W2971031619","https://openalex.org/W2990747716","https://openalex.org/W2994073215","https://openalex.org/W3007553593","https://openalex.org/W3032377877","https://openalex.org/W3033324992","https://openalex.org/W3035172746","https://openalex.org/W3089529768","https://openalex.org/W3091006519","https://openalex.org/W3091492359","https://openalex.org/W3093963693","https://openalex.org/W3098009429","https://openalex.org/W3099689767","https://openalex.org/W3103780890","https://openalex.org/W3105017587","https://openalex.org/W3108630339","https://openalex.org/W3116213608","https://openalex.org/W3127488121","https://openalex.org/W3165743669","https://openalex.org/W3190215236","https://openalex.org/W3208422024","https://openalex.org/W3208836296","https://openalex.org/W3216772467","https://openalex.org/W4213377513","https://openalex.org/W4241541814","https://openalex.org/W4251408821","https://openalex.org/W4288594419","https://openalex.org/W4306882120","https://openalex.org/W6627932998","https://openalex.org/W6737893269","https://openalex.org/W6741002519","https://openalex.org/W6745594345","https://openalex.org/W6745935785","https://openalex.org/W6746316224","https://openalex.org/W6747473740","https://openalex.org/W6747941106","https://openalex.org/W6752963931","https://openalex.org/W6755355032","https://openalex.org/W6755921573","https://openalex.org/W6756840741","https://openalex.org/W6758846586","https://openalex.org/W6760425463","https://openalex.org/W6769596995","https://openalex.org/W6771750343","https://openalex.org/W6774126978","https://openalex.org/W6779265984","https://openalex.org/W6780587392","https://openalex.org/W6784178060","https://openalex.org/W6786812442","https://openalex.org/W6794641712","https://openalex.org/W6799560697","https://openalex.org/W6802251749","https://openalex.org/W6803030377","https://openalex.org/W6803274636","https://openalex.org/W6803572779","https://openalex.org/W6804601995","https://openalex.org/W6810152107"],"related_works":["https://openalex.org/W4238897586","https://openalex.org/W435179959","https://openalex.org/W2619091065","https://openalex.org/W2059640416","https://openalex.org/W1490753184","https://openalex.org/W2284465472","https://openalex.org/W2291782699","https://openalex.org/W1993948687","https://openalex.org/W2000169967","https://openalex.org/W2167883292"],"abstract_inverted_index":{"Driving":[0],"safely":[1],"requires":[2],"multiple":[3],"capabilities":[4],"from":[5,94],"human":[6],"and":[7,24,99,114,119,130,143,151,174,182,189],"intelligent":[8],"agents,":[9],"such":[10],"as":[11],"the":[12,17,21,25,32,41,51,70,96,100,149,152,155,160,163,184],"generalizability":[13,124],"to":[14,50,68,159],"unseen":[15,126],"environments,":[16],"safety":[18],"awareness":[19],"of":[20,35,40,53,72,90,111,154,162],"surrounding":[22],"traffic,":[23],"decision-making":[26],"in":[27,116,179],"complex":[28],"multi-agent":[29,120,132,175],"settings.":[30],"Despite":[31],"great":[33],"success":[34],"Reinforcement":[36],"Learning":[37],"(RL),":[38],"most":[39],"RL":[42,112,164],"research":[43,71],"works":[44],"investigate":[45],"each":[46],"capability":[47],"separately":[48],"due":[49],"lack":[52],"integrated":[54],"environments.":[55],"In":[56],"this":[57],"work,":[58],"we":[59,107],"develop":[60],"a":[61,109],"new":[62],"driving":[63,92],"simulation":[64],"platform":[65],"called":[66],"MetaDrive":[67,80,180],"support":[69],"generalizable":[73],"reinforcement":[74,172,176],"learning":[75,131,173,177],"algorithms":[76,178],"for":[77],"machine":[78],"autonomy.":[79],"is":[81],"highly":[82],"compositional,":[83],"which":[84],"can":[85],"generate":[86],"an":[87],"infinite":[88],"number":[89],"diverse":[91],"scenarios":[93,142,145],"both":[95,117,139],"procedural":[97],"generation":[98],"real":[101],"data":[102],"importing.":[103],"Based":[104],"on":[105,138],"MetaDrive,":[106],"construct":[108],"variety":[110],"tasks":[113],"baselines":[115],"single-agent":[118],"settings,":[121],"including":[122],"benchmarking":[123],"across":[125],"scenes,":[127],"safe":[128,171],"exploration,":[129],"traffic.":[133],"The":[134],"generalization":[135],"experiments":[136],"conducted":[137],"procedurally":[140],"generated":[141],"real-world":[144],"show":[146],"that":[147],"increasing":[148],"diversity":[150],"size":[153],"training":[156],"set":[157],"leads":[158],"improvement":[161],"agent's":[165],"generalizability.":[166],"We":[167],"further":[168],"evaluate":[169],"various":[170],"environments":[181],"provide":[183],"benchmarks.":[185],"Source":[186],"code,":[187],"documentation,":[188],"demo":[190],"video":[191],"are":[192],"available":[193],"at":[194],"https://metadriverse.github.io/metadrive.":[195]},"counts_by_year":[{"year":2026,"cited_by_count":7},{"year":2025,"cited_by_count":85},{"year":2024,"cited_by_count":55},{"year":2023,"cited_by_count":35},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":3}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-10T00:00:00"}
