{"id":"https://openalex.org/W2794337547","doi":"https://doi.org/10.1109/iros.2018.8593758","title":"Multi-Agent Imitation Learning for Driving Simulation","display_name":"Multi-Agent Imitation Learning for Driving Simulation","publication_year":2018,"publication_date":"2018-10-01","ids":{"openalex":"https://openalex.org/W2794337547","doi":"https://doi.org/10.1109/iros.2018.8593758","mag":"2794337547"},"language":"en","primary_location":{"id":"doi:10.1109/iros.2018.8593758","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros.2018.8593758","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1803.01044","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017330847","display_name":"Raunak Bhattacharyya","orcid":"https://orcid.org/0000-0001-9254-8417"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Raunak P. Bhattacharyya","raw_affiliation_strings":["Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, USA","Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, 94305, USA"],"affiliations":[{"raw_affiliation_string":"Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, 94305, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109358690","display_name":"Derek J. Phillips","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Derek J. Phillips","raw_affiliation_strings":["Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, USA","Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, 94305, USA"],"affiliations":[{"raw_affiliation_string":"Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, 94305, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035437064","display_name":"Blake Wulfe","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Blake Wulfe","raw_affiliation_strings":["Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, USA","Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, 94305, USA"],"affiliations":[{"raw_affiliation_string":"Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, 94305, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025330492","display_name":"Jeremy Morton","orcid":"https://orcid.org/0000-0002-3794-9258"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jeremy Morton","raw_affiliation_strings":["Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, USA","Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, 94305, USA"],"affiliations":[{"raw_affiliation_string":"Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, 94305, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036044637","display_name":"Alex Kuefler","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alex Kuefler","raw_affiliation_strings":["Osaro Inc., San Francisco, CA, USA","Osaro Inc., 1182nd Street, Suite 200, San Francisco, CA, 94105, USA"],"affiliations":[{"raw_affiliation_string":"Osaro Inc., San Francisco, CA, USA","institution_ids":[]},{"raw_affiliation_string":"Osaro Inc., 1182nd Street, Suite 200, San Francisco, CA, 94105, USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5068326377","display_name":"Mykel J. Kochenderfer","orcid":"https://orcid.org/0000-0002-7238-9663"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mykel J. Kochenderfer","raw_affiliation_strings":["Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, USA","Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, 94305, USA"],"affiliations":[{"raw_affiliation_string":"Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"Stanford Intelligent Systems Laboratory, Stanford University, Stanford, CA, 94305, USA","institution_ids":["https://openalex.org/I97018004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5017330847"],"corresponding_institution_ids":["https://openalex.org/I97018004"],"apc_list":null,"apc_paid":null,"fwci":0.9928123,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.78936393,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1534","last_page":"1539"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9842000007629395,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.8133910298347473},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.6799227595329285},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.6746824979782104},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6705406308174133},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5279245376586914},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4405028820037842},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.40328913927078247},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.15980425477027893},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.09624499082565308}],"concepts":[{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.8133910298347473},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.6799227595329285},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.6746824979782104},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6705406308174133},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5279245376586914},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4405028820037842},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.40328913927078247},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.15980425477027893},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.09624499082565308}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/iros.2018.8593758","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros.2018.8593758","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1803.01044","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1803.01044","pdf_url":"https://arxiv.org/pdf/1803.01044","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"mag:2794337547","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1803.01044.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1803.01044","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1803.01044","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1803.01044","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1803.01044","pdf_url":"https://arxiv.org/pdf/1803.01044","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1542941925","https://openalex.org/W1974812331","https://openalex.org/W1999874108","https://openalex.org/W2034368206","https://openalex.org/W2107544712","https://openalex.org/W2160643434","https://openalex.org/W2165413656","https://openalex.org/W2166302491","https://openalex.org/W2167485994","https://openalex.org/W2168359464","https://openalex.org/W2328067583","https://openalex.org/W2342662072","https://openalex.org/W2434014514","https://openalex.org/W2519106163","https://openalex.org/W2545546008","https://openalex.org/W2580495915","https://openalex.org/W2581637843","https://openalex.org/W2605135824","https://openalex.org/W2735089625","https://openalex.org/W2739748921","https://openalex.org/W2770884134","https://openalex.org/W2883057932","https://openalex.org/W2949608212","https://openalex.org/W2951276827","https://openalex.org/W2951520714","https://openalex.org/W2962957031","https://openalex.org/W3148740559","https://openalex.org/W6638018090","https://openalex.org/W6640174482","https://openalex.org/W6718092244","https://openalex.org/W6735913928","https://openalex.org/W6741115023","https://openalex.org/W6741832134","https://openalex.org/W6746015766","https://openalex.org/W6746462176"],"related_works":["https://openalex.org/W2883057932","https://openalex.org/W3089591632","https://openalex.org/W2976846901","https://openalex.org/W2969966185","https://openalex.org/W3014012509","https://openalex.org/W2979363950","https://openalex.org/W2987890415","https://openalex.org/W3005850366","https://openalex.org/W2292969843","https://openalex.org/W3003285662","https://openalex.org/W3049691496","https://openalex.org/W2953942860","https://openalex.org/W3004268170","https://openalex.org/W3098974658","https://openalex.org/W1252772818","https://openalex.org/W1512345936","https://openalex.org/W2244447337","https://openalex.org/W3145417110","https://openalex.org/W2891046288","https://openalex.org/W3171077607"],"abstract_inverted_index":{"Simulation":[0],"is":[1],"an":[2],"appealing":[3],"option":[4],"for":[5,71],"validating":[6],"the":[7,72,124],"safety":[8],"of":[9,74,127],"autonomous":[10],"vehicles.":[11],"Generative":[12],"Adversarial":[13],"Imitation":[14],"Learning":[15],"(GAIL)":[16],"has":[17],"recently":[18],"been":[19],"shown":[20],"to":[21,44,90],"learn":[22],"representative":[23],"human":[24,28,128],"driver":[25,29],"models.":[26],"These":[27],"models":[30,69],"were":[31],"learned":[32],"through":[33,94],"training":[34,56],"in":[35,42,99,118],"single-agent":[36,104],"environments,":[37],"but":[38],"they":[39],"have":[40],"difficulty":[41],"generalizing":[43],"multi-agent":[45,120],"driving":[46,75],"scenarios.":[47],"We":[48,87],"argue":[49],"these":[50,92],"difficulties":[51],"arise":[52],"because":[53],"observations":[54],"at":[55,115],"and":[57,122],"test":[58],"time":[59,85],"are":[60],"sampled":[61],"from":[62],"different":[63],"distributions.":[64],"This":[65],"difference":[66],"makes":[67],"such":[68],"unsuitable":[70],"simulation":[73],"scenes,":[76],"where":[77],"multiple":[78],"agents":[79],"must":[80],"interact":[81],"realistically":[82],"over":[83],"long":[84],"horizons.":[86],"extend":[88],"GAIL":[89,105],"address":[91],"shortcomings":[93],"a":[95,119],"parameter-sharing":[96],"approach":[97],"grounded":[98],"curriculum":[100],"learning.":[101],"Compared":[102],"with":[103],"policies,":[106],"policies":[107],"generated":[108],"by":[109],"our":[110],"PS-GAIL":[111],"method":[112],"prove":[113],"superior":[114],"interacting":[116],"stably":[117],"setting":[121],"capturing":[123],"emergent":[125],"behavior":[126],"drivers.":[129]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":3},{"year":2019,"cited_by_count":2}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
