{"id":"https://openalex.org/W4390547633","doi":"https://doi.org/10.1109/lcsys.2024.3349511","title":"Developing Driving Strategies Efficiently: A Skill-Based Hierarchical Reinforcement Learning Approach","display_name":"Developing Driving Strategies Efficiently: A Skill-Based Hierarchical Reinforcement Learning Approach","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4390547633","doi":"https://doi.org/10.1109/lcsys.2024.3349511"},"language":"en","primary_location":{"id":"doi:10.1109/lcsys.2024.3349511","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lcsys.2024.3349511","pdf_url":null,"source":{"id":"https://openalex.org/S4306422535","display_name":"IEEE Control Systems Letters","issn_l":"2475-1456","issn":["2475-1456"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Control Systems Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053037902","display_name":"Yi\u011fit G\u00fcrses","orcid":"https://orcid.org/0009-0008-3367-7495"},"institutions":[{"id":"https://openalex.org/I168864056","display_name":"Bilkent University","ror":"https://ror.org/02vh8a032","country_code":"TR","type":"education","lineage":["https://openalex.org/I168864056"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Yigit Gurses","raw_affiliation_strings":["Department of Computer Engineering, Bilkent University, Ankara, Turkey"],"raw_orcid":"https://orcid.org/0009-0008-3367-7495","affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Bilkent University, Ankara, Turkey","institution_ids":["https://openalex.org/I168864056"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047511859","display_name":"Kaan Buyukdemirci","orcid":null},"institutions":[{"id":"https://openalex.org/I168864056","display_name":"Bilkent University","ror":"https://ror.org/02vh8a032","country_code":"TR","type":"education","lineage":["https://openalex.org/I168864056"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Kaan Buyukdemirci","raw_affiliation_strings":["Department of Electrical and Electronics Engineering, Bilkent University, Ankara, Turkey"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Electronics Engineering, Bilkent University, Ankara, Turkey","institution_ids":["https://openalex.org/I168864056"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014536360","display_name":"Y\u0131ld\u0131ray Y\u0131ld\u0131z","orcid":"https://orcid.org/0000-0001-6270-5354"},"institutions":[{"id":"https://openalex.org/I168864056","display_name":"Bilkent University","ror":"https://ror.org/02vh8a032","country_code":"TR","type":"education","lineage":["https://openalex.org/I168864056"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Yildiray Yildiz","raw_affiliation_strings":["Department of Mechanical Engineering, Bilkent University, Ankara, Turkey"],"raw_orcid":"https://orcid.org/0000-0001-6270-5354","affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, Bilkent University, Ankara, Turkey","institution_ids":["https://openalex.org/I168864056"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5053037902"],"corresponding_institution_ids":["https://openalex.org/I168864056"],"apc_list":null,"apc_paid":null,"fwci":1.8998,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.84147913,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"8","issue":null,"first_page":"121","last_page":"126"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10525","display_name":"Human-Automation Interaction and Safety","score":0.9866999983787537,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8506723642349243},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.7469173073768616},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7370633482933044},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.6607320308685303},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.6219587326049805},{"id":"https://openalex.org/keywords/high-fidelity","display_name":"High fidelity","score":0.5646750330924988},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5067194104194641},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.4774382710456848},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.4421161413192749},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.405911386013031},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.35020455718040466},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.15075376629829407},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.0742962658405304}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8506723642349243},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7469173073768616},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7370633482933044},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.6607320308685303},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.6219587326049805},{"id":"https://openalex.org/C113364801","wikidata":"https://www.wikidata.org/wiki/Q26674","display_name":"High fidelity","level":2,"score":0.5646750330924988},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5067194104194641},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.4774382710456848},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.4421161413192749},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.405911386013031},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.35020455718040466},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.15075376629829407},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0742962658405304},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lcsys.2024.3349511","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lcsys.2024.3349511","pdf_url":null,"source":{"id":"https://openalex.org/S4306422535","display_name":"IEEE Control Systems Letters","issn_l":"2475-1456","issn":["2475-1456"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Control Systems Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W2111876879","https://openalex.org/W2583993537","https://openalex.org/W2766034338","https://openalex.org/W2766258251","https://openalex.org/W2766447205","https://openalex.org/W2781726626","https://openalex.org/W2897697565","https://openalex.org/W2902907165","https://openalex.org/W2949267040","https://openalex.org/W2953326529","https://openalex.org/W2963322416","https://openalex.org/W2963438456","https://openalex.org/W2963523627","https://openalex.org/W2964227312","https://openalex.org/W2968202530","https://openalex.org/W2989847975","https://openalex.org/W2990123902","https://openalex.org/W2996037775","https://openalex.org/W3002044607","https://openalex.org/W3100944043","https://openalex.org/W3118210634","https://openalex.org/W3127561923","https://openalex.org/W3132674603","https://openalex.org/W3168892396","https://openalex.org/W3174288549","https://openalex.org/W3209253128","https://openalex.org/W3214229832","https://openalex.org/W4205780117","https://openalex.org/W4288055678","https://openalex.org/W4288289109","https://openalex.org/W4298845604","https://openalex.org/W4320449037","https://openalex.org/W6631943919","https://openalex.org/W6675945467","https://openalex.org/W6734215269","https://openalex.org/W6745174960","https://openalex.org/W6747473740","https://openalex.org/W6748440607","https://openalex.org/W6748603076","https://openalex.org/W6756319914","https://openalex.org/W6764724164","https://openalex.org/W6765240361","https://openalex.org/W6772005887","https://openalex.org/W6791000347","https://openalex.org/W6791194670","https://openalex.org/W6840583796","https://openalex.org/W6848961728","https://openalex.org/W6884300163"],"related_works":["https://openalex.org/W4313443006","https://openalex.org/W2945374968","https://openalex.org/W4385452045","https://openalex.org/W4293777179","https://openalex.org/W2164070813","https://openalex.org/W2135608140","https://openalex.org/W4224231624","https://openalex.org/W2319626700","https://openalex.org/W3099598016","https://openalex.org/W4319589573"],"abstract_inverted_index":{"Driving":[0],"in":[1,80,117],"dense":[2],"traffic":[3],"with":[4,112,133],"human":[5,34],"and":[6,17,26,74,96],"autonomous":[7,46],"drivers":[8,20],"is":[9,56],"a":[10,57,118],"challenging":[11],"task":[12,24],"that":[13,108,122,129],"requires":[14],"high-level":[15,99],"planning":[16],"reasoning.":[18],"Human":[19],"can":[21,39,70],"achieve":[22,130],"this":[23,78,81],"comfortably,":[25],"there":[27],"has":[28],"been":[29],"many":[30],"efforts":[31],"to":[32,50,60,137],"model":[33,61],"driver":[35,62,127],"strategies.":[36],"These":[37],"strategies":[38],"be":[40,71],"used":[41,97],"as":[42,98],"inspirations":[43],"for":[44,106],"developing":[45],"driving":[47,87],"algorithms":[48],"or":[49],"create":[51],"high-fidelity":[52],"simulators.":[53],"Reinforcement":[54],"learning":[55,140],"common":[58],"tool":[59],"policies,":[63],"but":[64],"conventional":[65],"training":[66,104,135],"of":[67],"these":[68],"models":[69,111,128],"computationally":[72],"expensive":[73],"time-consuming.":[75],"To":[76],"address":[77],"issue,":[79],"letter,":[82],"we":[83],"propose":[84],"\u201cskill-based\u201d":[85],"hierarchical":[86],"strategies,":[88],"where":[89],"motion":[90],"primitives,":[91],"i.e.,":[92],"skills,":[93],"are":[94],"designed":[95],"actions.":[100],"This":[101],"reduces":[102],"the":[103,123],"time":[105],"applications":[107],"require":[109],"multiple":[110],"varying":[113],"behavior.":[114],"Simulation":[115],"results":[116],"merging":[119],"scenario":[120],"demonstrate":[121],"proposed":[124],"approach":[125],"yields":[126],"higher":[131],"performance":[132],"less":[134],"compared":[136],"baseline":[138],"reinforcement":[139],"methods.":[141]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":4}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
