{"id":"https://openalex.org/W4392908444","doi":"https://doi.org/10.1109/tits.2024.3368474","title":"Enhancing Car-Following Performance in Traffic Oscillations Using Expert Demonstration Reinforcement Learning","display_name":"Enhancing Car-Following Performance in Traffic Oscillations Using Expert Demonstration Reinforcement Learning","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392908444","doi":"https://doi.org/10.1109/tits.2024.3368474"},"language":"en","primary_location":{"id":"doi:10.1109/tits.2024.3368474","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2024.3368474","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027375285","display_name":"Meng Li","orcid":"https://orcid.org/0000-0001-6944-0053"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]},{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN","SG"],"is_corresponding":true,"raw_author_name":"Meng Li","raw_affiliation_strings":["School of Transportation, Southeast University, Nanjing, China","School of Mechanical and Aerospace Engineering, Nanyang Technological University, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0001-6944-0053","affiliations":[{"raw_affiliation_string":"School of Transportation, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]},{"raw_affiliation_string":"School of Mechanical and Aerospace Engineering, Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100351555","display_name":"Zhibin Li","orcid":"https://orcid.org/0000-0001-7192-6853"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhibin Li","raw_affiliation_strings":["School of Transportation, Southeast University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0001-7192-6853","affiliations":[{"raw_affiliation_string":"School of Transportation, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007077356","display_name":"Zehong Cao","orcid":"https://orcid.org/0000-0003-3656-0328"},"institutions":[{"id":"https://openalex.org/I170239107","display_name":"University of South Australia","ror":"https://ror.org/01p93h210","country_code":"AU","type":"education","lineage":["https://openalex.org/I170239107"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Zehong Cao","raw_affiliation_strings":["STEM, University of South Australia, Adelaide, SA, Australia"],"raw_orcid":"https://orcid.org/0000-0003-3656-0328","affiliations":[{"raw_affiliation_string":"STEM, University of South Australia, Adelaide, SA, Australia","institution_ids":["https://openalex.org/I170239107"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5027375285"],"corresponding_institution_ids":["https://openalex.org/I172675005","https://openalex.org/I76569877"],"apc_list":null,"apc_paid":null,"fwci":3.7863,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.93447304,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"25","issue":"7","first_page":"7751","last_page":"7766"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10698","display_name":"Transportation Planning and Optimization","score":0.9689000248908997,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11344","display_name":"Traffic Prediction and Management Techniques","score":0.9635999798774719,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6658278703689575},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4871930480003357},{"id":"https://openalex.org/keywords/automotive-engineering","display_name":"Automotive engineering","score":0.42655134201049805},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.3397473692893982},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.31661415100097656},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.28309494256973267}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6658278703689575},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4871930480003357},{"id":"https://openalex.org/C171146098","wikidata":"https://www.wikidata.org/wiki/Q124192","display_name":"Automotive engineering","level":1,"score":0.42655134201049805},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3397473692893982},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.31661415100097656},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28309494256973267}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tits.2024.3368474","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2024.3368474","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5180636669","display_name":null,"funder_award_id":"52232012","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6891822477","display_name":null,"funder_award_id":"52272331","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":65,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W2046482177","https://openalex.org/W2119159364","https://openalex.org/W2152374007","https://openalex.org/W2170973929","https://openalex.org/W2515191420","https://openalex.org/W2559655401","https://openalex.org/W2612690371","https://openalex.org/W2613761153","https://openalex.org/W2736601468","https://openalex.org/W2741122588","https://openalex.org/W2744953678","https://openalex.org/W2754517384","https://openalex.org/W2761873684","https://openalex.org/W2788862220","https://openalex.org/W2912445127","https://openalex.org/W2947106284","https://openalex.org/W2963864421","https://openalex.org/W2964784128","https://openalex.org/W2976036462","https://openalex.org/W2978585366","https://openalex.org/W2981426338","https://openalex.org/W2988773531","https://openalex.org/W3017204849","https://openalex.org/W3080742113","https://openalex.org/W3090027660","https://openalex.org/W3121091948","https://openalex.org/W3127009812","https://openalex.org/W3130143314","https://openalex.org/W3153133376","https://openalex.org/W3153676008","https://openalex.org/W3169363132","https://openalex.org/W3193947369","https://openalex.org/W3200131627","https://openalex.org/W3203000071","https://openalex.org/W3210590548","https://openalex.org/W3211345831","https://openalex.org/W4205900122","https://openalex.org/W4214554111","https://openalex.org/W4214643773","https://openalex.org/W4214826322","https://openalex.org/W4220902452","https://openalex.org/W4221147127","https://openalex.org/W4226257065","https://openalex.org/W4229333161","https://openalex.org/W4236088649","https://openalex.org/W4280531426","https://openalex.org/W4281972499","https://openalex.org/W4282944694","https://openalex.org/W4286447577","https://openalex.org/W4312059601","https://openalex.org/W4312260978","https://openalex.org/W4318541446","https://openalex.org/W4367146630","https://openalex.org/W4382463422","https://openalex.org/W4391781515","https://openalex.org/W6684921986","https://openalex.org/W6717230150","https://openalex.org/W6730641667","https://openalex.org/W6741002519","https://openalex.org/W6742461812","https://openalex.org/W6793857347","https://openalex.org/W6796791731","https://openalex.org/W6810152107","https://openalex.org/W6839744550"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4306904969","https://openalex.org/W2358668433","https://openalex.org/W2138720691","https://openalex.org/W2376932109","https://openalex.org/W4362501864","https://openalex.org/W2001405890","https://openalex.org/W4380318855","https://openalex.org/W2358190750"],"abstract_inverted_index":{"Deep":[0],"reinforcement":[1,51],"learning":[2,52,171],"(DRL)":[3],"algorithms":[4],"often":[5],"face":[6],"challenges":[7],"in":[8,24,32,43,157],"achieving":[9],"stability":[10],"and":[11,19,62,114,173],"efficiency":[12],"due":[13],"to":[14,57,70,80,176],"significant":[15],"policy":[16],"gradient":[17],"variance":[18],"inaccurate":[20],"reward":[21],"function":[22],"estimation":[23],"complex":[25],"scenarios.":[26],"This":[27],"study":[28],"addresses":[29],"these":[30],"issues":[31],"the":[33,82,92,119,130,134,146,150],"context":[34],"of":[35],"multi-objective":[36],"car-following":[37,64,77,108,116,135],"control":[38,78],"tasks":[39],"with":[40,133],"time":[41],"lag":[42],"traffic":[44,105,159],"oscillations.":[45],"We":[46],"propose":[47],"an":[48,111],"expert":[49,72,95,122,147],"demonstration":[50],"(EDRL)":[53],"approach":[54],"that":[55,163],"aims":[56],"stabilize":[58],"training,":[59,128],"accelerate":[60],"learning,":[61],"enhance":[63],"performance.":[65],"The":[66,137],"key":[67],"idea":[68],"is":[69],"leverage":[71],"demonstrations,":[73],"which":[74],"represent":[75],"superior":[76],"experiences,":[79],"improve":[81],"DRL":[83],"policy.":[84],"Our":[85],"method":[86,166],"involves":[87],"two":[88],"sequential":[89],"steps.":[90],"In":[91,118],"first":[93],"step,":[94,121],"demonstrations":[96,123,148],"are":[97,124,140],"obtained":[98,125],"during":[99,126],"offline":[100],"pretraining":[101],"by":[102],"utilizing":[103],"prior":[104],"knowledge,":[106],"including":[107],"trajectories":[109],"from":[110],"empirical":[112],"database":[113],"classic":[115],"models.":[117],"second":[120],"online":[127],"where":[129],"agent":[131],"interacts":[132],"environment.":[136],"EDRL":[138],"agents":[139],"trained":[141],"through":[142],"supervised":[143],"regression":[144],"on":[145],"using":[149],"behavioral":[151],"cloning":[152],"technique.":[153],"Experimental":[154],"results":[155],"conducted":[156],"various":[158],"oscillation":[160],"scenarios":[161],"demonstrate":[162],"our":[164],"proposed":[165],"significantly":[167],"enhances":[168],"training":[169],"stability,":[170],"speed,":[172],"rewards":[174],"compared":[175],"baseline":[177],"algorithms.":[178]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
