{"id":"https://openalex.org/W2942735643","doi":"https://doi.org/10.1109/iros40897.2019.8968205","title":"Driving with Style: Inverse Reinforcement Learning in General-Purpose Planning for Automated Driving","display_name":"Driving with Style: Inverse Reinforcement Learning in General-Purpose Planning for Automated Driving","publication_year":2019,"publication_date":"2019-11-01","ids":{"openalex":"https://openalex.org/W2942735643","doi":"https://doi.org/10.1109/iros40897.2019.8968205","mag":"2942735643"},"language":"en","primary_location":{"id":"doi:10.1109/iros40897.2019.8968205","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros40897.2019.8968205","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1905.00229","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Sascha Rosbach","orcid":null},"institutions":[{"id":"https://openalex.org/I1319473763","display_name":"Volkswagen Group (Germany)","ror":"https://ror.org/01f3bhg26","country_code":"DE","type":"company","lineage":["https://openalex.org/I1319473763"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Sascha Rosbach","raw_affiliation_strings":["Volkswagen AG,Wolfsburg,Germany,38440"],"affiliations":[{"raw_affiliation_string":"Volkswagen AG,Wolfsburg,Germany,38440","institution_ids":["https://openalex.org/I1319473763"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Vinit James","orcid":null},"institutions":[{"id":"https://openalex.org/I1319473763","display_name":"Volkswagen Group (Germany)","ror":"https://ror.org/01f3bhg26","country_code":"DE","type":"company","lineage":["https://openalex.org/I1319473763"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Vinit James","raw_affiliation_strings":["Volkswagen AG,Wolfsburg,Germany,38440"],"affiliations":[{"raw_affiliation_string":"Volkswagen AG,Wolfsburg,Germany,38440","institution_ids":["https://openalex.org/I1319473763"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Simon Gro\u00dfjohann","orcid":null},"institutions":[{"id":"https://openalex.org/I1319473763","display_name":"Volkswagen Group (Germany)","ror":"https://ror.org/01f3bhg26","country_code":"DE","type":"company","lineage":["https://openalex.org/I1319473763"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Simon Gro\u00dfjohann","raw_affiliation_strings":["Volkswagen AG,Wolfsburg,Germany,38440"],"affiliations":[{"raw_affiliation_string":"Volkswagen AG,Wolfsburg,Germany,38440","institution_ids":["https://openalex.org/I1319473763"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Silviu Homoceanu","orcid":null},"institutions":[{"id":"https://openalex.org/I1319473763","display_name":"Volkswagen Group (Germany)","ror":"https://ror.org/01f3bhg26","country_code":"DE","type":"company","lineage":["https://openalex.org/I1319473763"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Silviu Homoceanu","raw_affiliation_strings":["Volkswagen AG,Wolfsburg,Germany,38440"],"affiliations":[{"raw_affiliation_string":"Volkswagen AG,Wolfsburg,Germany,38440","institution_ids":["https://openalex.org/I1319473763"]}]},{"author_position":"last","author":{"id":null,"display_name":"Stefan Roth","orcid":null},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Stefan Roth","raw_affiliation_strings":["Technische Universit&#x00E4;t Darmstadt,Visual Inference Lab,Darmstadt,64289"],"affiliations":[{"raw_affiliation_string":"Technische Universit&#x00E4;t Darmstadt,Visual Inference Lab,Darmstadt,64289","institution_ids":["https://openalex.org/I31512782"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I1319473763"],"apc_list":null,"apc_paid":null,"fwci":2.8011,"has_fulltext":false,"cited_by_count":50,"citation_normalized_percentile":{"value":0.90306744,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2658","last_page":"2665"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7081999778747559},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.6075000166893005},{"id":"https://openalex.org/keywords/planner","display_name":"Planner","score":0.6022999882698059},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.4970000088214874},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.478300005197525},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.451200008392334},{"id":"https://openalex.org/keywords/bellman-equation","display_name":"Bellman equation","score":0.3698999881744385},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.3675999939441681}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7081999778747559},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6535999774932861},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6349999904632568},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.6075000166893005},{"id":"https://openalex.org/C2776999362","wikidata":"https://www.wikidata.org/wiki/Q2349274","display_name":"Planner","level":2,"score":0.6022999882698059},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.4970000088214874},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.478300005197525},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.451200008392334},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4496999979019165},{"id":"https://openalex.org/C14646407","wikidata":"https://www.wikidata.org/wiki/Q1430750","display_name":"Bellman equation","level":2,"score":0.3698999881744385},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.3675999939441681},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.3646000027656555},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.3521000146865845},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.35089999437332153},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.3098999857902527},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.30630001425743103},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3034000098705292},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.2879999876022339},{"id":"https://openalex.org/C9679016","wikidata":"https://www.wikidata.org/wiki/Q1417473","display_name":"Principle of maximum entropy","level":2,"score":0.28769999742507935},{"id":"https://openalex.org/C199190896","wikidata":"https://www.wikidata.org/wiki/Q3509276","display_name":"Learning classifier system","level":3,"score":0.2842000126838684},{"id":"https://openalex.org/C145565327","wikidata":"https://www.wikidata.org/wiki/Q852514","display_name":"Motion control","level":3,"score":0.2800000011920929},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.272599995136261},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.26750001311302185},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2646999955177307},{"id":"https://openalex.org/C100368936","wikidata":"https://www.wikidata.org/wiki/Q1411725","display_name":"Crawling","level":2,"score":0.26170000433921814}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iros40897.2019.8968205","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros40897.2019.8968205","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1905.00229","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1905.00229","pdf_url":"https://arxiv.org/pdf/1905.00229","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1905.00229","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1905.00229","pdf_url":"https://arxiv.org/pdf/1905.00229","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W1527702126","https://openalex.org/W1919962963","https://openalex.org/W1999874108","https://openalex.org/W2142828048","https://openalex.org/W2155098712","https://openalex.org/W2169498096","https://openalex.org/W2192586580","https://openalex.org/W2343568200","https://openalex.org/W2511460750","https://openalex.org/W2530849036","https://openalex.org/W2565410644","https://openalex.org/W2744369598","https://openalex.org/W2749747771","https://openalex.org/W2783963507","https://openalex.org/W2800753541","https://openalex.org/W6674884181","https://openalex.org/W6691967218","https://openalex.org/W6696273291","https://openalex.org/W6752356361"],"related_works":[],"abstract_inverted_index":{"Behavior":[0],"and":[1,52,154,174],"motion":[2,16,54,61],"planning":[3,62],"play":[4],"an":[5,94,110],"important":[6,126],"role":[7],"in":[8,27,34],"automated":[9],"driving.":[10],"Traditionally,":[11],"behavior":[12,36,42,51],"planners":[13,17,37,46,58,135],"instruct":[14],"local":[15,53],"with":[18,136,166],"predefined":[19,41],"behaviors.":[20],"Due":[21],"to":[22,39,76,89,118,185],"the":[23,85,129,148,160,190],"high":[24],"scene":[25],"complexity":[26],"urban":[28],"environments,":[29],"unpredictable":[30],"situations":[31],"may":[32],"occur":[33],"which":[35],"fail":[38],"match":[40],"templates.":[43],"Recently,":[44],"general-purpose":[45,57,134],"have":[47],"been":[48],"introduced,":[49],"combining":[50],"planning.":[55],"These":[56],"allow":[59],"behavior-aware":[60],"given":[63],"a":[64,78,102],"single":[65],"reward":[66,86,99,121,176,187],"function.":[67],"However,":[68],"two":[69],"challenges":[70],"arise:":[71],"First,":[72],"this":[73,98,106],"function":[74,87,100],"has":[75,88],"map":[77],"complex":[79],"feature":[80],"space":[81],"into":[82,128],"rewards.":[83],"Second,":[84],"be":[90],"manually":[91],"tuned":[92],"by":[93],"expert.":[95],"Manually":[96],"tuning":[97,195],"becomes":[101],"tedious":[103],"task.":[104],"In":[105],"paper,":[107],"we":[108,158,182],"propose":[109],"approach":[111,145],"that":[112,181],"relies":[113],"on":[114,147],"human":[115,163],"driving":[116,130],"demonstrations":[117],"automatically":[119],"tune":[120],"functions.":[122,177],"This":[123],"study":[124],"offers":[125],"insights":[127],"style":[131],"optimization":[132],"of":[133,162,169,192],"maximum":[137],"entropy":[138],"inverse":[139],"reinforcement":[140],"learning.":[141],"We":[142],"evaluate":[143],"our":[144,170],"based":[146],"expected":[149],"value":[150],"difference":[151],"between":[152],"learned":[153,173],"demonstrated":[155],"policies.":[156],"Furthermore,":[157],"compare":[159],"similarity":[161],"driven":[164],"trajectories":[165],"optimal":[167],"policies":[168],"planner":[171],"under":[172],"expert-tuned":[175],"Our":[178],"experiments":[179],"show":[180],"are":[183],"able":[184],"learn":[186],"functions":[188],"exceeding":[189],"level":[191],"manual":[193],"expert":[194],"without":[196],"prior":[197],"domain":[198],"knowledge.":[199]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":10},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":5}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2019-05-09T00:00:00"}
