{"id":"https://openalex.org/W3157776331","doi":"https://doi.org/10.1109/cdc45484.2021.9683135","title":"Graph Neural Network Reinforcement Learning for Autonomous Mobility-on-Demand Systems","display_name":"Graph Neural Network Reinforcement Learning for Autonomous Mobility-on-Demand Systems","publication_year":2021,"publication_date":"2021-12-14","ids":{"openalex":"https://openalex.org/W3157776331","doi":"https://doi.org/10.1109/cdc45484.2021.9683135","mag":"3157776331"},"language":"en","primary_location":{"id":"doi:10.1109/cdc45484.2021.9683135","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cdc45484.2021.9683135","pdf_url":null,"source":{"id":"https://openalex.org/S4363607724","display_name":"2021 60th IEEE Conference on Decision and Control (CDC)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 60th IEEE Conference on Decision and Control (CDC)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2104.11434","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034366030","display_name":"Daniele Gammelli","orcid":"https://orcid.org/0000-0003-1802-4388"},"institutions":[{"id":"https://openalex.org/I96673099","display_name":"Technical University of Denmark","ror":"https://ror.org/04qtj9h94","country_code":"DK","type":"education","lineage":["https://openalex.org/I96673099"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Daniele Gammelli","raw_affiliation_strings":["Technical University of Denmark,DK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Technical University of Denmark,DK","institution_ids":["https://openalex.org/I96673099"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075233338","display_name":"Kaidi Yang","orcid":"https://orcid.org/0000-0001-5120-2866"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kaidi Yang","raw_affiliation_strings":["Stanford University,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stanford University,USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031821299","display_name":"J. Michael Harrison","orcid":"https://orcid.org/0000-0002-3657-2639"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"James Harrison","raw_affiliation_strings":["Stanford University,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stanford University,USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078981714","display_name":"Filipe Rodrigues","orcid":"https://orcid.org/0000-0001-6979-6498"},"institutions":[{"id":"https://openalex.org/I96673099","display_name":"Technical University of Denmark","ror":"https://ror.org/04qtj9h94","country_code":"DK","type":"education","lineage":["https://openalex.org/I96673099"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Filipe Rodrigues","raw_affiliation_strings":["Technical University of Denmark,DK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Technical University of Denmark,DK","institution_ids":["https://openalex.org/I96673099"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001424439","display_name":"Francisco C. Pereira","orcid":"https://orcid.org/0000-0001-5457-9909"},"institutions":[{"id":"https://openalex.org/I96673099","display_name":"Technical University of Denmark","ror":"https://ror.org/04qtj9h94","country_code":"DK","type":"education","lineage":["https://openalex.org/I96673099"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Francisco C. Pereira","raw_affiliation_strings":["Technical University of Denmark,DK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Technical University of Denmark,DK","institution_ids":["https://openalex.org/I96673099"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050003000","display_name":"Marco Pavone","orcid":"https://orcid.org/0000-0002-0206-4337"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Marco Pavone","raw_affiliation_strings":["Stanford University,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stanford University,USA","institution_ids":["https://openalex.org/I97018004"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.4746,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.85609244,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"2996","last_page":"3003"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10768","display_name":"Electric Vehicles and Infrastructure","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7845441699028015},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7257078886032104},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5505679249763489},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.4881773591041565},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4800175726413727},{"id":"https://openalex.org/keywords/network-topology","display_name":"Network topology","score":0.4532403349876404},{"id":"https://openalex.org/keywords/software-portability","display_name":"Software portability","score":0.437882661819458},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4326073229312897},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4187215268611908},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2515574097633362},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.16919153928756714}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7845441699028015},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7257078886032104},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5505679249763489},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4881773591041565},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4800175726413727},{"id":"https://openalex.org/C199845137","wikidata":"https://www.wikidata.org/wiki/Q145490","display_name":"Network topology","level":2,"score":0.4532403349876404},{"id":"https://openalex.org/C63000827","wikidata":"https://www.wikidata.org/wiki/Q3080428","display_name":"Software portability","level":2,"score":0.437882661819458},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4326073229312897},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4187215268611908},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2515574097633362},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.16919153928756714},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1109/cdc45484.2021.9683135","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cdc45484.2021.9683135","pdf_url":null,"source":{"id":"https://openalex.org/S4363607724","display_name":"2021 60th IEEE Conference on Decision and Control (CDC)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 60th IEEE Conference on Decision and Control (CDC)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2104.11434","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2104.11434","pdf_url":"https://arxiv.org/pdf/2104.11434","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:3157776331","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/2104.11434","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"pmh:oai:pure.atira.dk:publications/abe7b60a-ac86-4a39-9e77-e0a8c4023c16","is_oa":false,"landing_page_url":"https://orbit.dtu.dk/en/publications/abe7b60a-ac86-4a39-9e77-e0a8c4023c16","pdf_url":null,"source":{"id":"https://openalex.org/S4306400705","display_name":"Technical University of Denmark, DTU Orbit (Technical University of Denmark, DTU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I96673099","host_organization_name":"Technical University of Denmark","host_organization_lineage":["https://openalex.org/I96673099"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Gammelli , D , Yang , K , Harrison , J , Rodrigues , F , Pereira , F C &amp; Pavone , M 2021 , Graph Neural Network Reinforcement Learning for Autonomous Mobility-on-Demand Systems . in Proceedings of the 60th IEEE Conference on Decision and Control, CDC 2021 . Institute of Electrical and Electronics Engineers Inc. , pp. 2996-3003 , 60th IEEE Conference on Decision and Control , Austin , Texas , United States , 14/12/2021 . https://doi.org/10.1109/CDC45484.2021.9683135","raw_type":"contributionToPeriodical"},{"id":"doi:10.48550/arxiv.2104.11434","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2104.11434","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2104.11434","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2104.11434","pdf_url":"https://arxiv.org/pdf/2104.11434","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.7300000190734863,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320315934","display_name":"Toyota Research Institute","ror":null},{"id":"https://openalex.org/F4320320924","display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung","ror":"https://ror.org/00yjd3n13"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3157776331.pdf","grobid_xml":"https://content.openalex.org/works/W3157776331.grobid-xml"},"referenced_works_count":29,"referenced_works":["https://openalex.org/W312709805","https://openalex.org/W855132903","https://openalex.org/W2051805534","https://openalex.org/W2119717200","https://openalex.org/W2121863487","https://openalex.org/W2145339207","https://openalex.org/W2147800946","https://openalex.org/W2263673729","https://openalex.org/W2318160089","https://openalex.org/W2558748708","https://openalex.org/W2612340487","https://openalex.org/W2736601468","https://openalex.org/W2803952469","https://openalex.org/W2915314538","https://openalex.org/W2963144120","https://openalex.org/W2964015378","https://openalex.org/W2964043796","https://openalex.org/W2964121744","https://openalex.org/W2970971581","https://openalex.org/W3002603762","https://openalex.org/W3003899243","https://openalex.org/W3010723966","https://openalex.org/W3042024951","https://openalex.org/W3083366259","https://openalex.org/W3088562575","https://openalex.org/W4239634521","https://openalex.org/W6631190155","https://openalex.org/W6692846177","https://openalex.org/W6726873649"],"related_works":["https://openalex.org/W2787739227","https://openalex.org/W3033858290","https://openalex.org/W3202198751","https://openalex.org/W2261683202","https://openalex.org/W2533925791","https://openalex.org/W2890172044","https://openalex.org/W3180195251","https://openalex.org/W2090787586","https://openalex.org/W2987890415","https://openalex.org/W3203944359","https://openalex.org/W3212257828","https://openalex.org/W2896733904","https://openalex.org/W3145768065","https://openalex.org/W2896451037","https://openalex.org/W2757927221","https://openalex.org/W2527698548","https://openalex.org/W2142839172","https://openalex.org/W2947287992","https://openalex.org/W3014720921","https://openalex.org/W3029523729"],"abstract_inverted_index":{"Autonomous":[0],"mobility-on-demand":[1],"(AMoD)":[2],"systems":[3,82],"represent":[4,39],"a":[5,18,26,62,71],"rapidly":[6],"developing":[7],"mode":[8],"of":[9,21,29,41,80],"transportation":[10,31],"wherein":[11],"travel":[12],"requests":[13],"are":[14,103],"dynamically":[15],"handled":[16],"by":[17],"coordinated":[19],"fleet":[20],"robotic,":[22],"self-driving":[23],"vehicles.":[24],"Given":[25],"graph":[27,84,91],"representation":[28],"the":[30,42,46,54,78,120],"network":[32],"-":[33,50],"one":[34],"where,":[35],"for":[36],"example,":[37],"nodes":[38],"areas":[40],"city,":[43],"and":[44,108,141],"edges":[45],"connectivity":[47],"between":[48],"them":[49],"we":[51,69,88,117],"argue":[52],"that":[53,90,102],"AMoD":[55,81],"control":[56,77],"problem":[57],"is":[58],"naturally":[59],"cast":[60],"as":[61,135],"node-wise":[63],"decision-making":[64],"problem.":[65],"In":[66],"this":[67],"paper,":[68],"propose":[70],"deep":[72],"reinforcement":[73,95],"learning":[74,96],"framework":[75],"to":[76,98,143],"rebalancing":[79],"through":[83,113],"neural":[85,92],"networks.":[86],"Crucially,":[87],"demonstrate":[89],"networks":[93],"enable":[94],"agents":[97],"recover":[99],"behavior":[100],"policies":[101,111,122],"significantly":[104],"more":[105],"transferable,":[106],"generalizable,":[107],"scalable":[109],"than":[110],"learned":[112,121],"other":[114],"approaches.":[115],"Empirically,":[116],"show":[118],"how":[119],"exhibit":[123],"promising":[124],"zero-shot":[125],"transfer":[126],"capabilities":[127],"when":[128],"faced":[129],"with":[130],"critical":[131],"portability":[132],"tasks":[133],"such":[134],"inter-city":[136],"generalization,":[137],"service":[138],"area":[139],"expansion,":[140],"adaptation":[142],"potentially":[144],"complex":[145],"urban":[146],"topologies.":[147]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
