{"id":"https://openalex.org/W4394006698","doi":"https://doi.org/10.1109/mci.2024.3364428","title":"Encoding Distributional Soft Actor-Critic for Autonomous Driving in Multi-Lane Scenarios [Research Frontier]","display_name":"Encoding Distributional Soft Actor-Critic for Autonomous Driving in Multi-Lane Scenarios [Research Frontier]","publication_year":2024,"publication_date":"2024-04-05","ids":{"openalex":"https://openalex.org/W4394006698","doi":"https://doi.org/10.1109/mci.2024.3364428"},"language":"en","primary_location":{"id":"doi:10.1109/mci.2024.3364428","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mci.2024.3364428","pdf_url":null,"source":{"id":"https://openalex.org/S104797584","display_name":"IEEE Computational Intelligence Magazine","issn_l":"1556-603X","issn":["1556-603X","1556-6048"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Computational Intelligence Magazine","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067909017","display_name":"Jingliang Duan","orcid":"https://orcid.org/0000-0002-3697-1576"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jingliang Duan","raw_affiliation_strings":["University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3697-1576","affiliations":[{"raw_affiliation_string":"University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007325049","display_name":"Yangang Ren","orcid":"https://orcid.org/0000-0002-1173-7230"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yangang Ren","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-1173-7230","affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103031147","display_name":"Fawang Zhang","orcid":"https://orcid.org/0009-0002-7455-9694"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fawang Zhang","raw_affiliation_strings":["Beijing Institute of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0002-7455-9694","affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100696317","display_name":"Jie Li","orcid":"https://orcid.org/0000-0002-3718-5593"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Li","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3718-5593","affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100747108","display_name":"Shengbo Eben Li","orcid":"https://orcid.org/0000-0003-4923-3633"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shengbo Eben Li","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-4923-3633","affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082794136","display_name":"Yang Guan","orcid":"https://orcid.org/0000-0003-0689-0510"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Guan","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-0689-0510","affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064709557","display_name":"Keqiang Li","orcid":"https://orcid.org/0000-0001-6223-5401"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Keqiang Li","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-6223-5401","affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5067909017"],"corresponding_institution_ids":["https://openalex.org/I92403157"],"apc_list":null,"apc_paid":null,"fwci":7.6161,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.9762903,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"19","issue":"2","first_page":"96","last_page":"112"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9684000015258789,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9657999873161316,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7933032512664795},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.6475063562393188},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6392433643341064},{"id":"https://openalex.org/keywords/generality","display_name":"Generality","score":0.616722822189331},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.48205289244651794},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4683586657047272},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.4442082643508911},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4345986247062683},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4292130172252655}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7933032512664795},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.6475063562393188},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6392433643341064},{"id":"https://openalex.org/C2780767217","wikidata":"https://www.wikidata.org/wiki/Q5532421","display_name":"Generality","level":2,"score":0.616722822189331},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.48205289244651794},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4683586657047272},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.4442082643508911},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4345986247062683},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4292130172252655},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C542102704","wikidata":"https://www.wikidata.org/wiki/Q183257","display_name":"Psychotherapist","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/mci.2024.3364428","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mci.2024.3364428","pdf_url":null,"source":{"id":"https://openalex.org/S104797584","display_name":"IEEE Computational Intelligence Magazine","issn_l":"1556-603X","issn":["1556-603X","1556-6048"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Computational Intelligence Magazine","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1267632332","display_name":null,"funder_award_id":"FRF-OT-23-02","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"}],"funders":[{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null},{"id":"https://openalex.org/F4592020493","display_name":"Didi Joint Research Center for Future Mobility, Tsinghua University","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W2027197837","https://openalex.org/W2145339207","https://openalex.org/W2588289902","https://openalex.org/W2736601468","https://openalex.org/W2736791111","https://openalex.org/W2739529772","https://openalex.org/W2752236613","https://openalex.org/W2766447205","https://openalex.org/W2869375357","https://openalex.org/W2896288931","https://openalex.org/W2899663614","https://openalex.org/W2903709398","https://openalex.org/W2904246096","https://openalex.org/W2904263972","https://openalex.org/W2963322416","https://openalex.org/W2963625099","https://openalex.org/W2968983352","https://openalex.org/W2970065535","https://openalex.org/W2990123902","https://openalex.org/W3002044607","https://openalex.org/W3015082424","https://openalex.org/W3046214590","https://openalex.org/W3088218629","https://openalex.org/W3102270594","https://openalex.org/W3127561923","https://openalex.org/W3165559047","https://openalex.org/W3211345831","https://openalex.org/W4210870706","https://openalex.org/W4225390809","https://openalex.org/W4226275976","https://openalex.org/W4285071855","https://openalex.org/W4287617987","https://openalex.org/W4308080451","https://openalex.org/W4312876648","https://openalex.org/W4315588599","https://openalex.org/W4362650413","https://openalex.org/W4375929017","https://openalex.org/W4376481351","https://openalex.org/W6684921986","https://openalex.org/W6734517396","https://openalex.org/W6739901393","https://openalex.org/W6741002519","https://openalex.org/W6744580074","https://openalex.org/W6748839928","https://openalex.org/W6755977528","https://openalex.org/W6757592117","https://openalex.org/W6849153783"],"related_works":["https://openalex.org/W2372020181","https://openalex.org/W2156531654","https://openalex.org/W1581723585","https://openalex.org/W4378714697","https://openalex.org/W2294330161","https://openalex.org/W2940472653","https://openalex.org/W2253069048","https://openalex.org/W2804553224","https://openalex.org/W140709781","https://openalex.org/W3214340375"],"abstract_inverted_index":{"This":[0],"paper":[1],"proposes":[2],"a":[3,66,72],"new":[4],"reinforcement":[5],"learning":[6],"(RL)":[7],"algorithm,":[8],"called":[9],"encoding":[10,56,111],"distributional":[11,57,86],"soft":[12],"actor-critic":[13],"(E-DSAC),":[14],"for":[15,28,42],"decision-making":[16,23],"in":[17,48,84,99,175,201],"autonomous":[18,173],"driving.":[19],"Unlike":[20],"existing":[21],"RL-based":[22],"methods,":[24],"E-DSAC":[25,115,165,186],"is":[26,36,62,93,117],"suitable":[27],"situations":[29],"where":[30],"the":[31,40,79,85,109,114,121,126,130,135,139,144,152,155,161,176,180],"number":[32],"of":[33,81,101,125,134,154,189],"surrounding":[34],"vehicles":[35],"variable":[37],"and":[38,52,103,143,170],"eliminates":[39],"requirement":[41],"manually":[43],"pre-designed":[44],"sorting":[45],"rules,":[46],"resulting":[47],"higher":[49],"policy":[50,58,131,162,182],"performance":[51,183],"generality.":[53],"Firstly,":[54],"an":[55],"iteration":[59],"(DPI)":[60],"framework":[61,92],"developed":[63,110],"by":[64,119,164,185,191],"embedding":[65],"permutation":[67],"invariant":[68],"module,":[69],"which":[70],"employs":[71],"feature":[73,127],"neural":[74],"network":[75],"(NN)":[76],"to":[77,95,129,150],"encode":[78],"indicators":[80],"each":[82],"vehicle,":[83],"RL":[87],"framework.":[88],"The":[89],"proposed":[90,118,156],"DPI":[91,112],"proven":[94],"exhibit":[96],"important":[97],"properties":[98],"terms":[100],"convergence":[102],"global":[104],"optimality.":[105],"Next,":[106],"based":[107],"on":[108],"framework,":[113],"algorithm":[116],"adding":[120],"gradient-based":[122],"update":[123],"rule":[124],"NN":[128],"evaluation":[132],"process":[133],"DSAC":[136,190],"algorithm.":[137,157],"Then,":[138],"multi-lane":[140],"driving":[141,174],"task":[142],"corresponding":[145],"reward":[146],"function":[147],"are":[148],"designed":[149,177],"verify":[151],"effectiveness":[153,196],"Results":[158],"show":[159],"that":[160,188],"learned":[163],"can":[166],"realize":[167],"efficient,":[168],"smooth,":[169],"relatively":[171],"safe":[172],"scenario.":[178],"And":[179],"final":[181],"attained":[184],"surpasses":[187],"approximately":[192],"threefold.":[193],"Furthermore,":[194],"its":[195],"has":[197],"also":[198],"been":[199],"verified":[200],"real":[202],"vehicle":[203],"experiments.":[204]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":12},{"year":2024,"cited_by_count":10}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
