{"id":"https://openalex.org/W3157893055","doi":"https://doi.org/10.1016/j.artint.2022.103829","title":"Reward (Mis)design for autonomous driving","display_name":"Reward (Mis)design for autonomous driving","publication_year":2022,"publication_date":"2022-12-13","ids":{"openalex":"https://openalex.org/W3157893055","doi":"https://doi.org/10.1016/j.artint.2022.103829","mag":"3157893055"},"language":"en","primary_location":{"id":"doi:10.1016/j.artint.2022.103829","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.artint.2022.103829","pdf_url":null,"source":{"id":"https://openalex.org/S196139623","display_name":"Artificial Intelligence","issn_l":"0004-3702","issn":["0004-3702","1872-7921"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1016/j.artint.2022.103829","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056649746","display_name":"W. Bradley Knox","orcid":"https://orcid.org/0000-0002-6006-9523"},"institutions":[{"id":"https://openalex.org/I4210120115","display_name":"Robert Bosch (United States)","ror":"https://ror.org/02venad53","country_code":"US","type":"company","lineage":["https://openalex.org/I4210120115","https://openalex.org/I889804353"]},{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"W. Bradley Knox","raw_affiliation_strings":["Robert Bosch LLC , United States of America","The University of Texas at Austin, United States of America"],"raw_orcid":"https://orcid.org/0000-0002-6006-9523","affiliations":[{"raw_affiliation_string":"Robert Bosch LLC , United States of America","institution_ids":["https://openalex.org/I4210120115"]},{"raw_affiliation_string":"The University of Texas at Austin, United States of America","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059194708","display_name":"Alessandro Allievi","orcid":"https://orcid.org/0000-0001-5793-7679"},"institutions":[{"id":"https://openalex.org/I4210120115","display_name":"Robert Bosch (United States)","ror":"https://ror.org/02venad53","country_code":"US","type":"company","lineage":["https://openalex.org/I4210120115","https://openalex.org/I889804353"]},{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alessandro Allievi","raw_affiliation_strings":["Robert Bosch LLC , United States of America","The University of Texas at Austin, United States of America"],"raw_orcid":"https://orcid.org/0000-0001-5793-7679","affiliations":[{"raw_affiliation_string":"Robert Bosch LLC , United States of America","institution_ids":["https://openalex.org/I4210120115"]},{"raw_affiliation_string":"The University of Texas at Austin, United States of America","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085188713","display_name":"Holger Banzhaf","orcid":"https://orcid.org/0000-0003-2160-413X"},"institutions":[{"id":"https://openalex.org/I889804353","display_name":"Robert Bosch (Germany)","ror":"https://ror.org/01fe0jt45","country_code":"DE","type":"company","lineage":["https://openalex.org/I889804353"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Holger Banzhaf","raw_affiliation_strings":["Robert Bosch GmbH, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Robert Bosch GmbH, Germany","institution_ids":["https://openalex.org/I889804353"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101604340","display_name":"Felix Schmitt","orcid":"https://orcid.org/0000-0002-5411-5116"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Felix Schmitt","raw_affiliation_strings":["Bosch Center for Artificial Intelligence, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Bosch Center for Artificial Intelligence, Germany","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001594330","display_name":"Peter Stone","orcid":"https://orcid.org/0000-0002-6795-420X"},"institutions":[{"id":"https://openalex.org/I2800278093","display_name":"Sony Corporation (United States)","ror":"https://ror.org/05k91zb11","country_code":"US","type":"company","lineage":["https://openalex.org/I2800278093"]},{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Peter Stone","raw_affiliation_strings":["Sony AI, United States of America","The University of Texas at Austin, United States of America"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sony AI, United States of America","institution_ids":["https://openalex.org/I2800278093"]},{"raw_affiliation_string":"The University of Texas at Austin, United States of America","institution_ids":["https://openalex.org/I86519309"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5056649746"],"corresponding_institution_ids":["https://openalex.org/I4210120115","https://openalex.org/I86519309"],"apc_list":{"value":3670,"currency":"USD","value_usd":3670},"apc_paid":{"value":3670,"currency":"USD","value_usd":3670},"fwci":7.6903,"has_fulltext":false,"cited_by_count":75,"citation_normalized_percentile":{"value":0.98230841,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":100},"biblio":{"volume":"316","issue":null,"first_page":"103829","last_page":"103829"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10042","display_name":"Neural and Behavioral Psychology Studies","score":0.9207000136375427,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10042","display_name":"Neural and Behavioral Psychology Studies","score":0.9207000136375427,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9118000268936157,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sanity","display_name":"Sanity","score":0.8393994569778442},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6506127119064331},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6481584310531616},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.6294906139373779},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5272582769393921},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.413998544216156},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.37332168221473694},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.325273334980011},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.32449373602867126},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.3086603283882141},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.11231860518455505}],"concepts":[{"id":"https://openalex.org/C2777607469","wikidata":"https://www.wikidata.org/wiki/Q2915214","display_name":"Sanity","level":2,"score":0.8393994569778442},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6506127119064331},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6481584310531616},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.6294906139373779},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5272582769393921},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.413998544216156},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.37332168221473694},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.325273334980011},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.32449373602867126},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3086603283882141},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.11231860518455505},{"id":"https://openalex.org/C118552586","wikidata":"https://www.wikidata.org/wiki/Q7867","display_name":"Psychiatry","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.artint.2022.103829","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.artint.2022.103829","pdf_url":null,"source":{"id":"https://openalex.org/S196139623","display_name":"Artificial Intelligence","issn_l":"0004-3702","issn":["0004-3702","1872-7921"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.artint.2022.103829","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.artint.2022.103829","pdf_url":null,"source":{"id":"https://openalex.org/S196139623","display_name":"Artificial Intelligence","issn_l":"0004-3702","issn":["0004-3702","1872-7921"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G136333438","display_name":null,"funder_award_id":"FAIN-2019844","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G3694786146","display_name":null,"funder_award_id":"CPS-1739964","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G3881771821","display_name":null,"funder_award_id":"N00014-18-2243","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G5029475413","display_name":null,"funder_award_id":"IIS-1724157","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8828030238","display_name":null,"funder_award_id":"W911NF-19-2-0333","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320310620","display_name":"University of Texas at Austin","ror":"https://ror.org/00hj54h04"},{"id":"https://openalex.org/F4320313876","display_name":"Robert Bosch (Australia) Pty","ror":null},{"id":"https://openalex.org/F4320320869","display_name":"Robert Bosch Stiftung","ror":"https://ror.org/012kqkf58"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320337345","display_name":"Office of Naval Research","ror":"https://ror.org/00rk2pe57"},{"id":"https://openalex.org/F4320338281","display_name":"Army Research Office","ror":"https://ror.org/05epdh915"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":109,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W398859631","https://openalex.org/W569478347","https://openalex.org/W1499408472","https://openalex.org/W1777239053","https://openalex.org/W1929981607","https://openalex.org/W1951419471","https://openalex.org/W1982640125","https://openalex.org/W2056354534","https://openalex.org/W2061562262","https://openalex.org/W2098774185","https://openalex.org/W2102660061","https://openalex.org/W2121863487","https://openalex.org/W2122410182","https://openalex.org/W2129286663","https://openalex.org/W2130750514","https://openalex.org/W2144846366","https://openalex.org/W2151382427","https://openalex.org/W2159600763","https://openalex.org/W2160519132","https://openalex.org/W2186544110","https://openalex.org/W2462906003","https://openalex.org/W2472097883","https://openalex.org/W2483227611","https://openalex.org/W2525579820","https://openalex.org/W2534225927","https://openalex.org/W2592285292","https://openalex.org/W2599174273","https://openalex.org/W2620908320","https://openalex.org/W2620974420","https://openalex.org/W2623293810","https://openalex.org/W2755893646","https://openalex.org/W2783058961","https://openalex.org/W2785324569","https://openalex.org/W2805560727","https://openalex.org/W2837605352","https://openalex.org/W2869375357","https://openalex.org/W2898696016","https://openalex.org/W2904263972","https://openalex.org/W2927638312","https://openalex.org/W2947981406","https://openalex.org/W2962782357","https://openalex.org/W2962867954","https://openalex.org/W2962937519","https://openalex.org/W2963259955","https://openalex.org/W2963508354","https://openalex.org/W2963625099","https://openalex.org/W2963646405","https://openalex.org/W2964061993","https://openalex.org/W2964263543","https://openalex.org/W2964321288","https://openalex.org/W2968983352","https://openalex.org/W2970065535","https://openalex.org/W2978329087","https://openalex.org/W2990123902","https://openalex.org/W2991030916","https://openalex.org/W2998674842","https://openalex.org/W3005850366","https://openalex.org/W3006334608","https://openalex.org/W3023742835","https://openalex.org/W3027820740","https://openalex.org/W3034445502","https://openalex.org/W3102797050","https://openalex.org/W3103379718","https://openalex.org/W3121342653","https://openalex.org/W3127561923","https://openalex.org/W3130519362","https://openalex.org/W3147079603","https://openalex.org/W3149322120","https://openalex.org/W4231910836","https://openalex.org/W4239213227","https://openalex.org/W4241648823","https://openalex.org/W4245976051","https://openalex.org/W4255556797","https://openalex.org/W4285719527","https://openalex.org/W4300091631","https://openalex.org/W6638088447","https://openalex.org/W6674884181","https://openalex.org/W6682205418","https://openalex.org/W6683408100","https://openalex.org/W6683818699","https://openalex.org/W6720376148","https://openalex.org/W6735028971","https://openalex.org/W6738700159","https://openalex.org/W6739055881","https://openalex.org/W6739585900","https://openalex.org/W6743368274","https://openalex.org/W6745347688","https://openalex.org/W6745935785","https://openalex.org/W6748210908","https://openalex.org/W6752818208","https://openalex.org/W6752961934","https://openalex.org/W6753398287","https://openalex.org/W6755198365","https://openalex.org/W6756319914","https://openalex.org/W6756817394","https://openalex.org/W6758417531","https://openalex.org/W6760984284","https://openalex.org/W6761908843","https://openalex.org/W6763196849","https://openalex.org/W6763250322","https://openalex.org/W6766637160","https://openalex.org/W6770856692","https://openalex.org/W6771278216","https://openalex.org/W6773009993","https://openalex.org/W6773319185","https://openalex.org/W6777179232","https://openalex.org/W6785888886","https://openalex.org/W6788546958"],"related_works":["https://openalex.org/W4254131102","https://openalex.org/W2335233058","https://openalex.org/W2363707454","https://openalex.org/W4391879671","https://openalex.org/W2319595751","https://openalex.org/W4383823969","https://openalex.org/W3120570282","https://openalex.org/W2372667816","https://openalex.org/W3105199192","https://openalex.org/W4399927518"],"abstract_inverted_index":{"This":[0],"article":[1],"considers":[2],"the":[3,19,68,87,96,132],"problem":[4],"of":[5,21,134,145],"diagnosing":[6],"certain":[7],"common":[8,31],"errors":[9],"in":[10,42,51,72,80,86,108,139],"reward":[11,43,70,78,103,109,119,135],"design.":[12],"Its":[13],"insights":[14],"are":[15],"also":[16,115],"applicable":[17],"to":[18,100,151],"design":[20,110,120,133],"cost":[22],"functions":[23,79,136],"and":[24,54,75,83],"performance":[25],"metrics":[26],"more":[27],"generally.":[28],"To":[29],"diagnose":[30],"errors,":[32],"we":[33,65,90,94,125],"develop":[34],"8":[35,97],"simple":[36],"sanity":[37,98],"checks":[38,99],"for":[39,60,111,121,137],"identifying":[40],"flaws":[41,107],"functions.":[44],"We":[45],"survey":[46],"research":[47],"that":[48,113,129,147],"is":[49],"published":[50],"top-tier":[52],"venues":[53],"focuses":[55],"on":[56],"reinforcement":[57],"learning":[58],"(RL)":[59],"autonomous":[61],"driving":[62],"(AD).":[63],"Specifically,":[64],"closely":[66],"examine":[67],"reported":[69],"function":[71],"each":[73,101],"publication":[74],"present":[76],"these":[77],"a":[81,143],"complete":[82],"standardized":[84],"format":[85],"appendix.":[88],"Wherever":[89],"have":[91],"sufficient":[92],"information,":[93],"apply":[95],"surveyed":[102],"function,":[104],"revealing":[105],"near-universal":[106],"AD":[112,138],"might":[114],"exist":[116],"pervasively":[117],"across":[118],"other":[122,152],"tasks.":[123],"Lastly,":[124],"explore":[126],"promising":[127],"directions":[128],"may":[130],"aid":[131],"subsequent":[140],"research,":[141],"following":[142],"process":[144],"inquiry":[146],"can":[148],"be":[149],"adapted":[150],"domains.":[153]},"counts_by_year":[{"year":2026,"cited_by_count":7},{"year":2025,"cited_by_count":24},{"year":2024,"cited_by_count":31},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":3}],"updated_date":"2026-05-29T09:21:14.243279","created_date":"2025-10-10T00:00:00"}
