{"id":"https://openalex.org/W3097267688","doi":"https://doi.org/10.1109/access.2020.3034225","title":"Hierarchical Reinforcement Learning for Autonomous Decision Making and Motion Planning of Intelligent Vehicles","display_name":"Hierarchical Reinforcement Learning for Autonomous Decision Making and Motion Planning of Intelligent Vehicles","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3097267688","doi":"https://doi.org/10.1109/access.2020.3034225","mag":"3097267688"},"language":"en","primary_location":{"id":"doi:10.1109/access.2020.3034225","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3034225","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09241055.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09241055.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102006100","display_name":"Yang Lu","orcid":"https://orcid.org/0000-0002-4023-3963"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yang Lu","raw_affiliation_strings":["College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053112608","display_name":"Xin Xu","orcid":"https://orcid.org/0000-0003-3238-745X"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Xu","raw_affiliation_strings":["College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101668802","display_name":"Xinglong Zhang","orcid":"https://orcid.org/0000-0002-0587-2487"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinglong Zhang","raw_affiliation_strings":["College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065246382","display_name":"Lilin Qian","orcid":"https://orcid.org/0000-0002-6227-9970"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lilin Qian","raw_affiliation_strings":["Unmanned System Technology Research Center, National Innovation Institute of Defense Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Unmanned System Technology Research Center, National Innovation Institute of Defense Technology, Beijing, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101851239","display_name":"Xing Zhou","orcid":"https://orcid.org/0000-0001-6358-1621"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xing Zhou","raw_affiliation_strings":["College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5102006100"],"corresponding_institution_ids":["https://openalex.org/I170215575"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":2.1382,"has_fulltext":true,"cited_by_count":36,"citation_normalized_percentile":{"value":0.87116588,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"8","issue":null,"first_page":"209776","last_page":"209789"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.738862156867981},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7313275337219238},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.6463401317596436},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.6408474445343018},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5091778635978699},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.4631485342979431},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3438975512981415},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.3421751856803894}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.738862156867981},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7313275337219238},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.6463401317596436},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.6408474445343018},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5091778635978699},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.4631485342979431},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3438975512981415},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.3421751856803894}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2020.3034225","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3034225","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09241055.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:8404eb1734fd4f2fbe9ef3abc6709b17","is_oa":true,"landing_page_url":"https://doaj.org/article/8404eb1734fd4f2fbe9ef3abc6709b17","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 8, Pp 209776-209789 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2020.3034225","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3034225","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09241055.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7400000095367432,"id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1189737475","display_name":null,"funder_award_id":"2018YFB1305105","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G1231421488","display_name":null,"funder_award_id":"under","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3435950671","display_name":null,"funder_award_id":"and Gr","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G37568934","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3893329717","display_name":null,"funder_award_id":"Grant 2018YFB1305105","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5196624177","display_name":null,"funder_award_id":"61825305","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7457541925","display_name":null,"funder_award_id":"61751311","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8167847300","display_name":null,"funder_award_id":"2018YFB1305105","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8208342437","display_name":null,"funder_award_id":"1 and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3097267688.pdf","grobid_xml":"https://content.openalex.org/works/W3097267688.grobid-xml"},"referenced_works_count":50,"referenced_works":["https://openalex.org/W1578293866","https://openalex.org/W1971998222","https://openalex.org/W1996183429","https://openalex.org/W2000359213","https://openalex.org/W2003099253","https://openalex.org/W2003708116","https://openalex.org/W2012561930","https://openalex.org/W2023122515","https://openalex.org/W2028945152","https://openalex.org/W2032924574","https://openalex.org/W2046978863","https://openalex.org/W2055207897","https://openalex.org/W2071401582","https://openalex.org/W2099144379","https://openalex.org/W2108511252","https://openalex.org/W2116165149","https://openalex.org/W2118556122","https://openalex.org/W2128990851","https://openalex.org/W2132351269","https://openalex.org/W2133233905","https://openalex.org/W2135835974","https://openalex.org/W2144717132","https://openalex.org/W2163385431","https://openalex.org/W2167224731","https://openalex.org/W2169528473","https://openalex.org/W2306644740","https://openalex.org/W2342840547","https://openalex.org/W2556764949","https://openalex.org/W2559767995","https://openalex.org/W2586680856","https://openalex.org/W2896640299","https://openalex.org/W2905334533","https://openalex.org/W2953303875","https://openalex.org/W2962769637","https://openalex.org/W2963262099","https://openalex.org/W2964082383","https://openalex.org/W2967043083","https://openalex.org/W2967952682","https://openalex.org/W2992243386","https://openalex.org/W2996598994","https://openalex.org/W3004840042","https://openalex.org/W4236251699","https://openalex.org/W4285719527","https://openalex.org/W4293682399","https://openalex.org/W6662064237","https://openalex.org/W6679847170","https://openalex.org/W6679896305","https://openalex.org/W6684338915","https://openalex.org/W6703271639","https://openalex.org/W6704559304"],"related_works":["https://openalex.org/W2953234277","https://openalex.org/W2626256601","https://openalex.org/W2900413183","https://openalex.org/W4390975304","https://openalex.org/W147410782","https://openalex.org/W3022252430","https://openalex.org/W4287804464","https://openalex.org/W3103989898","https://openalex.org/W3211292372","https://openalex.org/W803346624"],"abstract_inverted_index":{"Autonomous":[0],"decision":[1,63,221],"making":[2,64,222],"and":[3,17,42,65,93,111,139,201,212,223],"motion":[4,40,66,105,224],"planning":[5,67,145,225],"in":[6,68,122,142,158,170,178,192,218,226],"complex":[7,69,193,227],"dynamic":[8,43,70,120],"traffic":[9,15,71,194,199],"environments,":[10],"such":[11],"as":[12],"left-turn":[13,197],"without":[14,198],"signals":[16,200],"multi-lane":[18,202],"merging":[19,203],"from":[20,184,204],"side-ways,":[21],"are":[22,115,190],"still":[23],"challenging":[24],"tasks":[25],"for":[26,61,99],"intelligent":[27,46],"vehicles.":[28,47],"It":[29],"is":[30,97,182],"difficult":[31],"to":[32],"generate":[33],"optimized":[34,220],"behavior":[35],"decisions":[36,133],"while":[37,174],"considering":[38],"the":[39,50,81,101,108,112,123,129,132,136,140,143,155,159,175,179,185,210,215],"capabilities":[41,106],"properties":[44],"of":[45,77,107,214],"Aiming":[48],"at":[49,135],"above":[51],"problems,":[52],"this":[53],"article":[54],"proposes":[55],"a":[56,84,118,163,171],"hierarchical":[57],"reinforcement":[58],"learning":[59],"approach":[60,75,217],"autonomous":[62],"scenarios.":[72,206],"The":[73,104,151,207],"proposed":[74,216],"consists":[76],"two":[78],"layers.":[79],"At":[80],"higher":[82,137,186],"layer,":[83],"kernel-based":[85],"least-squares":[86],"policy":[87],"iteration":[88],"algorithm":[89,168],"with":[90,117],"uneven":[91],"sampling":[92],"pooling":[94],"strategy":[95],"(USP-KLSPI)":[96],"presented":[98],"solving":[100],"decision-making":[102,124],"problems.":[103],"ego":[109],"vehicle":[110],"surrounding":[113],"vehicles":[114],"evaluated":[116],"high-fidelity":[119],"model":[121],"layer.":[125,187],"By":[126],"doing":[127],"so,":[128],"consistency":[130],"between":[131],"generated":[134],"layer":[138,146,153],"operations":[141],"lower":[144,152],"can":[147],"be":[148],"well":[149],"guaranteed.":[150],"addresses":[154],"motion-planning":[156],"problem":[157],"lateral":[160],"direction":[161,181],"using":[162],"dual":[164],"heuristic":[165],"programming":[166],"(DHP)":[167],"learned":[169],"batch-mode":[172],"manner,":[173],"velocity":[176],"profile":[177],"longitudinal":[180],"inherited":[183],"Extensive":[188],"simulations":[189],"conducted":[191],"conditions":[195],"including":[196],"side-ways":[205],"results":[208],"demonstrate":[209],"effectiveness":[211],"efficiency":[213],"realizing":[219],"environments.":[228]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":12},{"year":2021,"cited_by_count":2}],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2025-10-10T00:00:00"}
