{"id":"https://openalex.org/W3137786033","doi":"https://doi.org/10.1109/tits.2021.3096998","title":"Hierarchical Program-Triggered Reinforcement Learning Agents for Automated Driving","display_name":"Hierarchical Program-Triggered Reinforcement Learning Agents for Automated Driving","publication_year":2021,"publication_date":"2021-07-27","ids":{"openalex":"https://openalex.org/W3137786033","doi":"https://doi.org/10.1109/tits.2021.3096998","mag":"3137786033"},"language":"en","primary_location":{"id":"doi:10.1109/tits.2021.3096998","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2021.3096998","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2103.13861","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030381913","display_name":"Briti Gangopadhyay","orcid":"https://orcid.org/0000-0002-6488-9326"},"institutions":[{"id":"https://openalex.org/I145894827","display_name":"Indian Institute of Technology Kharagpur","ror":"https://ror.org/03w5sq511","country_code":"IN","type":"education","lineage":["https://openalex.org/I145894827"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Briti Gangopadhyay","raw_affiliation_strings":["Department of Computer Science and Engineering, IIT Kharagpur, Kharagpur, India"],"raw_orcid":"https://orcid.org/0000-0002-6488-9326","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, IIT Kharagpur, Kharagpur, India","institution_ids":["https://openalex.org/I145894827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062893916","display_name":"Harshit Soora","orcid":null},"institutions":[{"id":"https://openalex.org/I145894827","display_name":"Indian Institute of Technology Kharagpur","ror":"https://ror.org/03w5sq511","country_code":"IN","type":"education","lineage":["https://openalex.org/I145894827"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Harshit Soora","raw_affiliation_strings":["Department of Computer Science and Engineering, IIT Kharagpur, Kharagpur, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, IIT Kharagpur, Kharagpur, India","institution_ids":["https://openalex.org/I145894827"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033329960","display_name":"Pallab Dasgupta","orcid":"https://orcid.org/0000-0002-2178-8154"},"institutions":[{"id":"https://openalex.org/I145894827","display_name":"Indian Institute of Technology Kharagpur","ror":"https://ror.org/03w5sq511","country_code":"IN","type":"education","lineage":["https://openalex.org/I145894827"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Pallab Dasgupta","raw_affiliation_strings":["Department of Computer Science and Engineering, IIT Kharagpur, Kharagpur, India"],"raw_orcid":"https://orcid.org/0000-0002-2178-8154","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, IIT Kharagpur, Kharagpur, India","institution_ids":["https://openalex.org/I145894827"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.1615,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.91530604,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":100},"biblio":{"volume":"23","issue":"8","first_page":"10902","last_page":"10911"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8878271579742432},{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.7092618942260742},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6981887817382812},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6154102087020874},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5077499151229858},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5056328773498535},{"id":"https://openalex.org/keywords/crash","display_name":"Crash","score":0.49007999897003174},{"id":"https://openalex.org/keywords/hierarchy","display_name":"Hierarchy","score":0.444879412651062},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.38285189867019653},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.18783798813819885},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.13117974996566772},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12374421954154968},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.09298139810562134}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8878271579742432},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.7092618942260742},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6981887817382812},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6154102087020874},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5077499151229858},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5056328773498535},{"id":"https://openalex.org/C183469790","wikidata":"https://www.wikidata.org/wiki/Q333501","display_name":"Crash","level":2,"score":0.49007999897003174},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.444879412651062},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38285189867019653},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.18783798813819885},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.13117974996566772},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12374421954154968},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.09298139810562134},{"id":"https://openalex.org/C34447519","wikidata":"https://www.wikidata.org/wiki/Q179522","display_name":"Market economy","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tits.2021.3096998","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2021.3096998","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2103.13861","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2103.13861","pdf_url":"https://arxiv.org/pdf/2103.13861","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2103.13861","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2103.13861","pdf_url":"https://arxiv.org/pdf/2103.13861","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.8199999928474426,"id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":63,"referenced_works":["https://openalex.org/W1489391022","https://openalex.org/W1498432697","https://openalex.org/W1507116188","https://openalex.org/W1592847719","https://openalex.org/W1600438913","https://openalex.org/W1864649459","https://openalex.org/W1971259793","https://openalex.org/W1994530392","https://openalex.org/W2023808162","https://openalex.org/W2055207897","https://openalex.org/W2151977651","https://openalex.org/W2167224731","https://openalex.org/W2192586580","https://openalex.org/W2257979135","https://openalex.org/W2335959470","https://openalex.org/W2342840547","https://openalex.org/W2462906003","https://openalex.org/W2518731509","https://openalex.org/W2530849036","https://openalex.org/W2583993537","https://openalex.org/W2736791111","https://openalex.org/W2749747771","https://openalex.org/W2787196707","https://openalex.org/W2837605352","https://openalex.org/W2883459807","https://openalex.org/W2897007254","https://openalex.org/W2897676672","https://openalex.org/W2899455150","https://openalex.org/W2905249540","https://openalex.org/W2950935200","https://openalex.org/W2962867954","https://openalex.org/W2963262099","https://openalex.org/W2963709735","https://openalex.org/W2964043796","https://openalex.org/W2964168984","https://openalex.org/W2968202530","https://openalex.org/W2968983352","https://openalex.org/W2971510799","https://openalex.org/W2980133010","https://openalex.org/W2995120596","https://openalex.org/W3001665214","https://openalex.org/W3002044607","https://openalex.org/W3004129452","https://openalex.org/W3004135535","https://openalex.org/W3028335312","https://openalex.org/W3092220800","https://openalex.org/W3100944043","https://openalex.org/W3118975573","https://openalex.org/W3127561923","https://openalex.org/W4293682399","https://openalex.org/W4295719664","https://openalex.org/W4297781990","https://openalex.org/W4301501993","https://openalex.org/W6684338915","https://openalex.org/W6692846177","https://openalex.org/W6704559304","https://openalex.org/W6718836005","https://openalex.org/W6728155968","https://openalex.org/W6743333067","https://openalex.org/W6745935785","https://openalex.org/W6748571143","https://openalex.org/W6771648948","https://openalex.org/W6773165671"],"related_works":["https://openalex.org/W2905433371","https://openalex.org/W2888392564","https://openalex.org/W4310278675","https://openalex.org/W4388422664","https://openalex.org/W4390569940","https://openalex.org/W4361193272","https://openalex.org/W2963326959","https://openalex.org/W4388685194","https://openalex.org/W4312407344","https://openalex.org/W2894289927"],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2,15,26],"Reinforcement":[3,42,67],"Learning":[4,9,43],"(RL)":[5],"combined":[6],"with":[7,79],"Deep":[8,41],"(DL)":[10],"have":[11],"demonstrated":[12,129],"impressive":[13],"performance":[14],"complex":[16,59,120],"tasks,":[17,60,133],"including":[18],"autonomous":[19,27],"driving.":[20],"The":[21,91,123],"use":[22],"of":[23,40,52,74,93,125],"RL":[24,55,81,105,121],"agents":[25,56],"driving":[28,34,132],"leads":[29],"to":[30,57,85,96,108,118],"a":[31,46,71,75,87,109,119],"smooth":[32],"human-like":[33],"experience,":[35],"but":[36],"the":[37,97,104,126],"limited":[38],"interpretability":[39],"(DRL)":[44],"creates":[45],"verification":[47,94],"and":[48,113,134],"certification":[49],"bottleneck.":[50],"Instead":[51],"relying":[53],"on":[54,130],"learn":[58],"we":[61],"propose":[62],"HPRL":[63],"-":[64],"Hierarchical":[65],"Program-triggered":[66],"Learning,":[68],"which":[69],"uses":[70],"hierarchy":[72],"consisting":[73],"structured":[76],"program":[77,99],"along":[78],"multiple":[80],"agents,":[82,106],"each":[83],"trained":[84],"perform":[86],"relatively":[88],"simple":[89,101],"task.":[90],"focus":[92],"shifts":[95],"master":[98],"under":[100],"guarantees":[102],"from":[103],"leading":[107],"significantly":[110],"more":[111],"interpretable":[112],"verifiable":[114],"implementation":[115],"as":[116],"compared":[117],"agent.":[122],"evaluation":[124],"framework":[127],"is":[128],"different":[131],"National":[135],"Highway":[136],"Traffic":[137],"Safety":[138],"Administration":[139],"(NHTSA)":[140],"pre-crash":[141],"scenarios":[142],"using":[143],"CARLA,":[144],"an":[145],"open-source":[146],"dynamic":[147],"urban":[148],"simulation":[149],"environment.":[150]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":16},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2021-03-29T00:00:00"}
