{"id":"https://openalex.org/W4312935905","doi":"https://doi.org/10.1109/tvt.2022.3212996","title":"A Discrete Soft Actor-Critic Decision-Making Strategy With Sample Filter for Freeway Autonomous Driving","display_name":"A Discrete Soft Actor-Critic Decision-Making Strategy With Sample Filter for Freeway Autonomous Driving","publication_year":2022,"publication_date":"2022-10-10","ids":{"openalex":"https://openalex.org/W4312935905","doi":"https://doi.org/10.1109/tvt.2022.3212996"},"language":"en","primary_location":{"id":"doi:10.1109/tvt.2022.3212996","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvt.2022.3212996","pdf_url":null,"source":{"id":"https://openalex.org/S10936095","display_name":"IEEE Transactions on Vehicular Technology","issn_l":"0018-9545","issn":["0018-9545","1939-9359"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Vehicular Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101740669","display_name":"Jiayi Guan","orcid":"https://orcid.org/0000-0003-4097-438X"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiayi Guan","raw_affiliation_strings":["Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100323037","display_name":"Guang Chen","orcid":"https://orcid.org/0000-0002-7416-592X"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]},{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["CN","DE"],"is_corresponding":false,"raw_author_name":"Guang Chen","raw_affiliation_strings":["Tongji University, Shanghai, China","Chair of Robotics, Artificial Intelligence and Real-time Systems, Technical University of Munich, Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]},{"raw_affiliation_string":"Chair of Robotics, Artificial Intelligence and Real-time Systems, Technical University of Munich, Munich, Germany","institution_ids":["https://openalex.org/I62916508"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087389386","display_name":"Jin Huang","orcid":"https://orcid.org/0000-0001-8774-2936"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jin Huang","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100450024","display_name":"Zhijun Li","orcid":"https://orcid.org/0000-0002-3909-488X"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhijun Li","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100379486","display_name":"Lu Xiong","orcid":"https://orcid.org/0000-0002-1673-2658"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lu Xiong","raw_affiliation_strings":["Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091579598","display_name":"Jing Hou","orcid":"https://orcid.org/0000-0003-4778-137X"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Hou","raw_affiliation_strings":["Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063781430","display_name":"Alois Knoll","orcid":"https://orcid.org/0000-0003-4840-076X"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Alois Knoll","raw_affiliation_strings":["Chair of Robotics, Artificial Intelligence and Real-time Systems, Technical University of Munich, Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Chair of Robotics, Artificial Intelligence and Real-time Systems, Technical University of Munich, Munich, Germany","institution_ids":["https://openalex.org/I62916508"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101740669"],"corresponding_institution_ids":["https://openalex.org/I116953780"],"apc_list":null,"apc_paid":null,"fwci":2.5018,"has_fulltext":false,"cited_by_count":33,"citation_normalized_percentile":{"value":0.8915855,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"72","issue":"2","first_page":"2593","last_page":"2598"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9865999817848206,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7993759512901306},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.716188907623291},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.690038800239563},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.5268893241882324},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5110572576522827},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.4973898231983185},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.46997588872909546},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.3876500427722931},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.3203180134296417},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2895166277885437},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2382296919822693}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7993759512901306},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.716188907623291},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.690038800239563},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.5268893241882324},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5110572576522827},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.4973898231983185},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.46997588872909546},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.3876500427722931},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3203180134296417},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2895166277885437},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2382296919822693},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tvt.2022.3212996","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvt.2022.3212996","pdf_url":null,"source":{"id":"https://openalex.org/S10936095","display_name":"IEEE Transactions on Vehicular Technology","issn_l":"0018-9545","issn":["0018-9545","1939-9359"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Vehicular Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5299999713897705,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G6371315947","display_name":null,"funder_award_id":"61906138","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320319772","display_name":"Shanghai Center for Brain Science and Brain-Inspired Technology","ror":null},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W2736601468","https://openalex.org/W2746553466","https://openalex.org/W2768542523","https://openalex.org/W2769471004","https://openalex.org/W2795543364","https://openalex.org/W2963625099","https://openalex.org/W2981037657","https://openalex.org/W3003760566","https://openalex.org/W3012502004","https://openalex.org/W3015082424","https://openalex.org/W3016931720","https://openalex.org/W3017247368","https://openalex.org/W3020701983","https://openalex.org/W3044345353","https://openalex.org/W3045517780","https://openalex.org/W3048976565","https://openalex.org/W3090027660","https://openalex.org/W3119746519","https://openalex.org/W3175526935","https://openalex.org/W3177061762","https://openalex.org/W3200444035","https://openalex.org/W3202375294","https://openalex.org/W3205373118","https://openalex.org/W6683300800","https://openalex.org/W6687681856","https://openalex.org/W6692846177","https://openalex.org/W6741002519","https://openalex.org/W6747473740","https://openalex.org/W6769218391","https://openalex.org/W6776534271","https://openalex.org/W6784178060"],"related_works":["https://openalex.org/W2366107444","https://openalex.org/W4388145910","https://openalex.org/W2381570729","https://openalex.org/W1976205134","https://openalex.org/W4248336175","https://openalex.org/W2031260042","https://openalex.org/W2391445434","https://openalex.org/W3009369890","https://openalex.org/W4312490297","https://openalex.org/W2062212388"],"abstract_inverted_index":{"Autonomous":[0],"driving":[1,12,32,61,108,129],"is":[2],"a":[3,44,74,160,165],"promising":[4],"technology":[5],"to":[6,59,126,189],"reduce":[7],"traffic":[8],"accidents":[9],"and":[10,31,63,87,114,121,131,138,164,186],"improve":[11,60,127],"efficiency.":[13,132],"Although":[14],"significant":[15],"progress":[16],"has":[17],"been":[18],"achieved,":[19],"existing":[20],"decision-making":[21,46,104,171],"systems":[22],"of":[23,89,96],"autonomous":[24,107],"vehicle":[25,167],"still":[26],"cannot":[27],"meet":[28],"the":[29,50,84,90,94,102,111,117,122,128,142,143,170,190],"safety":[30,64,130],"efficiency":[33,62,86,185],"requirements":[34],"in":[35,169,183],"highly":[36],"dynamic":[37],"environments.":[38],"In":[39],"this":[40],"work,":[41],"we":[42,71,100,134],"design":[43,116],"discrete":[45,51,79,103,193],"strategy":[47,105,158],"based":[48,109],"on":[49,65,110,141,173],"soft":[52,80],"actor-critic":[53],"with":[54,67],"sample":[55,75,85],"filter":[56,76],"algorithm":[57,91,178],"(DSAC-SF)":[58],"freeways":[66],"dynamics":[68],"traffic.":[69],"Specifically,":[70],"first":[72],"propose":[73],"method":[77,120],"for":[78,106],"actor-critic,":[81],"which":[82],"improves":[83],"stability":[88,187],"via":[92],"enhancing":[93],"utilization":[95],"effective":[97],"samples.":[98],"Subsequently,":[99],"construct":[101],"DSAC-SF":[112,177],"algorithm,":[113],"further":[115],"area":[118],"observation":[119],"multi-objective":[123],"reward":[124],"function":[125],"Finally,":[133],"carry":[135],"out":[136],"comparison":[137],"ablation":[139],"experiments":[140],"scalable":[144],"multi-agent":[145],"reinforcement":[146,194],"learning":[147,195],"training":[148,184],"school":[149],"(SMARTS)":[150],"simulation":[151],"environment.":[152],"Experimental":[153],"results":[154],"indicate":[155],"that":[156],"our":[157,176],"obtains":[159],"high":[161],"success":[162],"rate":[163],"fast":[166],"speed":[168],"tasks":[172],"freeways.":[174],"Moreover,":[175],"also":[179],"achieves":[180],"improved":[181],"performance":[182],"compared":[188],"commonly":[191],"used":[192],"algorithm.":[196]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":10},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":9}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
