{"id":"https://openalex.org/W4391770221","doi":"https://doi.org/10.1109/itsc57777.2023.10422557","title":"Efficient-Enhanced Reinforcement Learning for Autonomous Driving in Urban Traffic Scenarios","display_name":"Efficient-Enhanced Reinforcement Learning for Autonomous Driving in Urban Traffic Scenarios","publication_year":2023,"publication_date":"2023-09-24","ids":{"openalex":"https://openalex.org/W4391770221","doi":"https://doi.org/10.1109/itsc57777.2023.10422557"},"language":"en","primary_location":{"id":"doi:10.1109/itsc57777.2023.10422557","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itsc57777.2023.10422557","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 26th International Conference on Intelligent Transportation Systems (ITSC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111261067","display_name":"Jianwen Yin","orcid":null},"institutions":[{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jianwen Yin","raw_affiliation_strings":["Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences,CAS Key Laboratory of Human-Machine Intelligence-Synergy Systems,Shenzhen,China,518055","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences,CAS Key Laboratory of Human-Machine Intelligence-Synergy Systems,Shenzhen,China,518055","institution_ids":["https://openalex.org/I4210145761","https://openalex.org/I19820366"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005920411","display_name":"Zhengmin Jiang","orcid":"https://orcid.org/0000-0002-6498-0234"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhengmin Jiang","raw_affiliation_strings":["Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences,CAS Key Laboratory of Human-Machine Intelligence-Synergy Systems,Shenzhen,China,518055","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences,CAS Key Laboratory of Human-Machine Intelligence-Synergy Systems,Shenzhen,China,518055","institution_ids":["https://openalex.org/I4210145761","https://openalex.org/I19820366"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101246522","display_name":"Qingyi Liang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]},{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingyi Liang","raw_affiliation_strings":["Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences,CAS Key Laboratory of Human-Machine Intelligence-Synergy Systems,Shenzhen,China,518055","Southern University of Science and Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences,CAS Key Laboratory of Human-Machine Intelligence-Synergy Systems,Shenzhen,China,518055","institution_ids":["https://openalex.org/I4210145761","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Southern University of Science and Technology, Shenzhen, China","institution_ids":["https://openalex.org/I3045169105"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100400663","display_name":"Wenfei Li","orcid":"https://orcid.org/0000-0002-3967-0058"},"institutions":[{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenfei Li","raw_affiliation_strings":["Research Institute of Interdisciplinary,Research center for intelligent transportation, Zhejiang lab,Hangzhou,China,311121"],"affiliations":[{"raw_affiliation_string":"Research Institute of Interdisciplinary,Research center for intelligent transportation, Zhejiang lab,Hangzhou,China,311121","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106482136","display_name":"Zhongming Pan","orcid":"https://orcid.org/0009-0005-8527-1129"},"institutions":[{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhongming Pan","raw_affiliation_strings":["Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences,CAS Key Laboratory of Human-Machine Intelligence-Synergy Systems,Shenzhen,China,518055"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences,CAS Key Laboratory of Human-Machine Intelligence-Synergy Systems,Shenzhen,China,518055","institution_ids":["https://openalex.org/I4210145761","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100614997","display_name":"Huiyun Li","orcid":"https://orcid.org/0000-0003-0157-1393"},"institutions":[{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huiyun Li","raw_affiliation_strings":["Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences,CAS Key Laboratory of Human-Machine Intelligence-Synergy Systems,Shenzhen,China,518055"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences,CAS Key Laboratory of Human-Machine Intelligence-Synergy Systems,Shenzhen,China,518055","institution_ids":["https://openalex.org/I4210145761","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079510458","display_name":"Jia Liu","orcid":"https://orcid.org/0000-0003-2363-8798"},"institutions":[{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jia Liu","raw_affiliation_strings":["Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences,CAS Key Laboratory of Human-Machine Intelligence-Synergy Systems,Shenzhen,China,518055"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences,CAS Key Laboratory of Human-Machine Intelligence-Synergy Systems,Shenzhen,China,518055","institution_ids":["https://openalex.org/I4210145761","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5111261067"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210145761","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.9391,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.76166186,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"887","last_page":"893"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.965399980545044,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11344","display_name":"Traffic Prediction and Management Techniques","score":0.9632999897003174,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8563894033432007},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.614537239074707},{"id":"https://openalex.org/keywords/transport-engineering","display_name":"Transport engineering","score":0.4926357865333557},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4117944836616516},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.35461944341659546},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.31172043085098267},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.23624083399772644}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8563894033432007},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.614537239074707},{"id":"https://openalex.org/C22212356","wikidata":"https://www.wikidata.org/wiki/Q775325","display_name":"Transport engineering","level":1,"score":0.4926357865333557},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4117944836616516},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.35461944341659546},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.31172043085098267},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.23624083399772644},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/itsc57777.2023.10422557","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itsc57777.2023.10422557","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 26th International Conference on Intelligent Transportation Systems (ITSC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.699999988079071,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2580495915","https://openalex.org/W2736601468","https://openalex.org/W2765302304","https://openalex.org/W2837605352","https://openalex.org/W2904246096","https://openalex.org/W2963679616","https://openalex.org/W2983617607","https://openalex.org/W2990123902","https://openalex.org/W3026104448","https://openalex.org/W3090027660","https://openalex.org/W3124225140","https://openalex.org/W3176912151","https://openalex.org/W3212409086","https://openalex.org/W4210870706","https://openalex.org/W4226257065","https://openalex.org/W4283819909","https://openalex.org/W4286376804","https://openalex.org/W4288347236","https://openalex.org/W6683300800","https://openalex.org/W6745935785","https://openalex.org/W6747473740","https://openalex.org/W6751629939","https://openalex.org/W6767112054","https://openalex.org/W6771312369"],"related_works":["https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W1987513656","https://openalex.org/W2072376847","https://openalex.org/W2089013912","https://openalex.org/W2145821588"],"abstract_inverted_index":{"Decision":[0],"intelligence":[1],"based":[2],"on":[3],"reinforcement":[4,16,54],"learning":[5,55],"has":[6,146],"gained":[7],"considerable":[8],"attention.":[9],"Compared":[10],"to":[11,93,117,124,156],"the":[12,15,24,75,84,88,95,98,101,107,114,119,126,129],"rule-based":[13],"approach,":[14],"learning-based":[17],"approach":[18,56,134,145],"shows":[19],"great":[20,40],"potential":[21],"in":[22,30,63,122,149],"addressing":[23],"challenge":[25],"of":[26,35,78,97,128,151],"high":[27],"interaction.":[28],"However,":[29],"urban":[31,64],"traffic":[32,65,79,138],"scenarios,":[33,80],"decision-making":[34],"autonomous":[36],"vehicles":[37],"remains":[38],"a":[39],"challenge,":[41],"including":[42],"sample":[43,108],"efficiency":[44],"and":[45,153],"stability.":[46],"In":[47],"this":[48],"paper,":[49],"we":[50,112],"develop":[51],"an":[52],"efficient":[53],"with":[57],"advanced":[58],"features":[59],"toward":[60],"end-to-end":[61],"navigation":[62],"scenarios.":[66,139],"Firstly,":[67],"bird's-eye-view":[68],"(BEV)":[69],"semantic":[70],"segmentation":[71],"is":[72,91],"served":[73],"as":[74],"concise":[76],"representation":[77],"which":[81],"can":[82],"boost":[83],"training":[85,103],"process.":[86],"Then":[87],"expert":[89],"demonstration":[90],"applied":[92],"guide":[94],"exploration":[96],"policy":[99],"at":[100],"initial":[102],"stage,":[104],"thereby":[105],"improving":[106],"efficiency.":[109],"At":[110],"last,":[111],"employ":[113],"quantile":[115],"regression":[116],"estimate":[118],"value":[120],"distribution":[121],"order":[123],"improve":[125],"stability":[127,154],"policy.":[130],"We":[131],"validate":[132],"our":[133,144],"using":[135],"different":[136],"simulated":[137],"Experimental":[140],"results":[141],"show":[142],"that":[143],"better":[147],"performance":[148],"terms":[150],"convergence":[152],"compared":[155],"other":[157],"baselines.":[158]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
