{"id":"https://openalex.org/W4290943640","doi":"https://doi.org/10.1145/3534678.3539180","title":"Graph Meta-Reinforcement Learning for Transferable Autonomous Mobility-on-Demand","display_name":"Graph Meta-Reinforcement Learning for Transferable Autonomous Mobility-on-Demand","publication_year":2022,"publication_date":"2022-08-12","ids":{"openalex":"https://openalex.org/W4290943640","doi":"https://doi.org/10.1145/3534678.3539180"},"language":"en","primary_location":{"id":"doi:10.1145/3534678.3539180","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3534678.3539180","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3534678.3539180","source":{"id":"https://openalex.org/S4363608767","display_name":"Proceedings of the 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3534678.3539180","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034366030","display_name":"Daniele Gammelli","orcid":"https://orcid.org/0000-0003-1802-4388"},"institutions":[{"id":"https://openalex.org/I96673099","display_name":"Technical University of Denmark","ror":"https://ror.org/04qtj9h94","country_code":"DK","type":"education","lineage":["https://openalex.org/I96673099"]}],"countries":["DK"],"is_corresponding":true,"raw_author_name":"Daniele Gammelli","raw_affiliation_strings":["Technical University of Denmark, Kgs. Lyngby, Denmark"],"affiliations":[{"raw_affiliation_string":"Technical University of Denmark, Kgs. Lyngby, Denmark","institution_ids":["https://openalex.org/I96673099"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075233338","display_name":"Kaidi Yang","orcid":"https://orcid.org/0000-0001-5120-2866"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kaidi Yang","raw_affiliation_strings":["Stanford University, Stanford, CA, USA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031821299","display_name":"J. Michael Harrison","orcid":"https://orcid.org/0000-0002-3657-2639"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"James Harrison","raw_affiliation_strings":["Google Research, Brain Team, San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google Research, Brain Team, San Francisco, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078981714","display_name":"Filipe Rodrigues","orcid":"https://orcid.org/0000-0001-6979-6498"},"institutions":[{"id":"https://openalex.org/I96673099","display_name":"Technical University of Denmark","ror":"https://ror.org/04qtj9h94","country_code":"DK","type":"education","lineage":["https://openalex.org/I96673099"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Filipe Rodrigues","raw_affiliation_strings":["Technical University of Denmark, Kgs. Lyngby , Denmark"],"affiliations":[{"raw_affiliation_string":"Technical University of Denmark, Kgs. Lyngby , Denmark","institution_ids":["https://openalex.org/I96673099"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001424439","display_name":"Francisco C. Pereira","orcid":"https://orcid.org/0000-0001-5457-9909"},"institutions":[{"id":"https://openalex.org/I96673099","display_name":"Technical University of Denmark","ror":"https://ror.org/04qtj9h94","country_code":"DK","type":"education","lineage":["https://openalex.org/I96673099"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Francisco Pereira","raw_affiliation_strings":["Technical University of Denmark, Kgs. Lyngby , Denmark"],"affiliations":[{"raw_affiliation_string":"Technical University of Denmark, Kgs. Lyngby , Denmark","institution_ids":["https://openalex.org/I96673099"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050003000","display_name":"Marco Pavone","orcid":"https://orcid.org/0000-0002-0206-4337"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Marco Pavone","raw_affiliation_strings":["Stanford University, Stanford, CA, USA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5034366030"],"corresponding_institution_ids":["https://openalex.org/I96673099"],"apc_list":null,"apc_paid":null,"fwci":3.8944,"has_fulltext":true,"cited_by_count":19,"citation_normalized_percentile":{"value":0.96290323,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2913","last_page":"2923"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10698","display_name":"Transportation Planning and Optimization","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7760767936706543},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7132213711738586},{"id":"https://openalex.org/keywords/service","display_name":"Service (business)","score":0.4649476110935211},{"id":"https://openalex.org/keywords/operations-research","display_name":"Operations research","score":0.33826494216918945},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.26480597257614136},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.14343911409378052}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7760767936706543},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7132213711738586},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.4649476110935211},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.33826494216918945},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26480597257614136},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.14343911409378052},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C136264566","wikidata":"https://www.wikidata.org/wiki/Q159810","display_name":"Economy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3534678.3539180","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3534678.3539180","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3534678.3539180","source":{"id":"https://openalex.org/S4363608767","display_name":"Proceedings of the 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3534678.3539180","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3534678.3539180","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3534678.3539180","source":{"id":"https://openalex.org/S4363608767","display_name":"Proceedings of the 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11","score":0.7699999809265137}],"awards":[{"id":"https://openalex.org/G1471419679","display_name":null,"funder_award_id":"P400P2_199332","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"},{"id":"https://openalex.org/G1650660105","display_name":"Design and Operation of AV-Enabled Mobility-on-Demand Systems","funder_award_id":"199332","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"},{"id":"https://openalex.org/G2962877871","display_name":null,"funder_award_id":"1837135","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G45908958","display_name":null,"funder_award_id":"Mobility","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"},{"id":"https://openalex.org/G4621158401","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"},{"id":"https://openalex.org/G6894402473","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320320924","display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung","ror":"https://ror.org/00yjd3n13"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4290943640.pdf","grobid_xml":"https://content.openalex.org/works/W4290943640.grobid-xml"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W126628216","https://openalex.org/W1890688605","https://openalex.org/W1988580225","https://openalex.org/W2089076789","https://openalex.org/W2095818975","https://openalex.org/W2157331557","https://openalex.org/W2260756217","https://openalex.org/W2296638040","https://openalex.org/W2552391307","https://openalex.org/W2604763608","https://openalex.org/W2612340487","https://openalex.org/W2803952469","https://openalex.org/W2911752602","https://openalex.org/W2915314538","https://openalex.org/W2963144120","https://openalex.org/W3002603762","https://openalex.org/W3003899243","https://openalex.org/W3015295488","https://openalex.org/W3022566517","https://openalex.org/W3088562575","https://openalex.org/W3089834075","https://openalex.org/W3155841317","https://openalex.org/W3176602965","https://openalex.org/W3186668962","https://openalex.org/W3210183837","https://openalex.org/W4206788904","https://openalex.org/W4214717370","https://openalex.org/W4226047880","https://openalex.org/W4231927217","https://openalex.org/W4411187082","https://openalex.org/W6639683144","https://openalex.org/W6640593155","https://openalex.org/W6663073678","https://openalex.org/W6677916085","https://openalex.org/W6751575707"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4306904969","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2138720691","https://openalex.org/W2376932109"],"abstract_inverted_index":{"Autonomous":[0],"Mobility-on-Demand":[1],"(AMoD)":[2],"systems":[3,29,56],"represent":[4],"an":[5,71,142],"attractive":[6],"alternative":[7],"to":[8,33,39,59,69,89,127,186,205,210],"existing":[9],"transportation":[10,80],"paradigms,":[11],"currently":[12,37],"challenged":[13],"by":[14,193],"urbanization":[15],"and":[16,35,140,223],"increasing":[17],"travel":[18],"needs.":[19],"By":[20],"centrally":[21],"controlling":[22,54],"a":[23,43,105,117,161,167],"fleet":[24],"of":[25,45,74,108,136,164],"self-driving":[26],"vehicles,":[27],"these":[28,123],"provide":[30],"mobility":[31],"service":[32,65],"customers":[34],"are":[36,57,156,184],"starting":[38],"be":[40],"deployed":[41],"in":[42,104,214],"number":[44,107],"cities":[46,192],"around":[47],"the":[48,60,64,78,114,129,134],"world.":[49],"Current":[50],"learning-based":[51],"approaches":[52],"for":[53,94],"AMoD":[55,92,131,154],"limited":[58],"single-city":[61,115],"scenario,":[62],"whereby":[63],"operator":[66],"is":[67],"allowed":[68],"take":[70],"unlimited":[72],"amount":[73,163],"operational":[75],"decisions":[76,110],"within":[77,166],"same":[79],"system.":[81],"However,":[82],"real-world":[83,215],"system":[84,173],"operators":[85],"can":[86],"hardly":[87],"afford":[88],"fully":[90],"re-train":[91],"controllers":[93,155],"every":[95],"city":[96,169],"they":[97],"operate":[98],"in,":[99],"as":[100,218],"this":[101],"could":[102],"result":[103],"high":[106],"poor-quality":[109],"during":[111],"training,":[112],"making":[113,199],"strategy":[116],"potentially":[118],"impractical":[119],"solution.":[120],"To":[121],"address":[122],"limitations,":[124],"we":[125,176],"propose":[126],"formalize":[128],"multi-city":[130],"problem":[132],"through":[133,182],"lens":[135],"meta-reinforcement":[137],"learning":[138,194],"(meta-RL)":[139],"devise":[141],"actor-critic":[143],"algorithm":[144],"based":[145],"on":[146,190],"recurrent":[147],"graph":[148],"neural":[149],"networks.":[150],"In":[151],"our":[152],"approach,":[153],"explicitly":[157],"trained":[158],"such":[159,217],"that":[160],"small":[162],"experience":[165],"new":[168],"will":[170],"produce":[171],"good":[172],"performance.":[174],"Empirically,":[175],"show":[177],"how":[178],"control":[179],"policies":[180],"learned":[181],"meta-RL":[183],"able":[185],"achieve":[187],"near-optimal":[188],"performance":[189],"unseen":[191],"rapidly":[195],"adaptable":[196],"policies,":[197],"thus":[198],"them":[200],"more":[201],"robust":[202],"not":[203],"only":[204],"novel":[206],"environments,":[207],"but":[208],"also":[209],"distribution":[211],"shifts":[212],"common":[213],"operations,":[216],"special":[219],"events,":[220],"unexpected":[221],"congestion,":[222],"dynamic":[224],"pricing":[225],"schemes.":[226]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":12},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2026-03-15T09:29:46.208133","created_date":"2025-10-10T00:00:00"}
