{"id":"https://openalex.org/W4389319185","doi":"https://doi.org/10.1109/tase.2023.3337230","title":"A Long-Term Actor Network for Human-Like Car-Following Trajectory Planning Guided by Offline Sample-Based Deep Inverse Reinforcement Learning","display_name":"A Long-Term Actor Network for Human-Like Car-Following Trajectory Planning Guided by Offline Sample-Based Deep Inverse Reinforcement Learning","publication_year":2023,"publication_date":"2023-12-04","ids":{"openalex":"https://openalex.org/W4389319185","doi":"https://doi.org/10.1109/tase.2023.3337230"},"language":"en","primary_location":{"id":"doi:10.1109/tase.2023.3337230","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2023.3337230","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019242097","display_name":"Jiangfeng Nan","orcid":"https://orcid.org/0000-0003-2126-1210"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiangfeng Nan","raw_affiliation_strings":["School of Transportation Science and Engineering, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Transportation Science and Engineering, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113724748","display_name":"Weiwen Deng","orcid":"https://orcid.org/0000-0002-3736-9368"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weiwen Deng","raw_affiliation_strings":["School of Transportation Science and Engineering, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Transportation Science and Engineering, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043023460","display_name":"Ruzheng Zhang","orcid":"https://orcid.org/0000-0002-0479-2792"},"institutions":[{"id":"https://openalex.org/I4401726824","display_name":"Horizon Robotics (China)","ror":"https://ror.org/05cmv6g68","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726824"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruzheng Zhang","raw_affiliation_strings":["Horizon Robotics, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Horizon Robotics, Beijing, China","institution_ids":["https://openalex.org/I4401726824"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100628921","display_name":"Ying Wang","orcid":"https://orcid.org/0000-0002-1121-4712"},"institutions":[{"id":"https://openalex.org/I4210134929","display_name":"Jilin Province Science and Technology Department","ror":"https://ror.org/049x38272","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210134929"]},{"id":"https://openalex.org/I194450716","display_name":"Jilin University","ror":"https://ror.org/00js3aw79","country_code":"CN","type":"education","lineage":["https://openalex.org/I194450716"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ying Wang","raw_affiliation_strings":["College of Computer Science and Technology, Jilin University, Jilin, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Jilin University, Jilin, China","institution_ids":["https://openalex.org/I4210134929","https://openalex.org/I194450716"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101847348","display_name":"Juan Ding","orcid":"https://orcid.org/0009-0009-1838-9708"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Juan Ding","raw_affiliation_strings":["PanoSim Technology Company Ltd., Jiaxing, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"PanoSim Technology Company Ltd., Jiaxing, Zhejiang, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5019242097"],"corresponding_institution_ids":["https://openalex.org/I82880672"],"apc_list":null,"apc_paid":null,"fwci":1.1172,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.78576439,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"21","issue":"4","first_page":"7094","last_page":"7106"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12095","display_name":"Vehicle emissions and performance","score":0.9853000044822693,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7301455736160278},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6117448806762695},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5936858654022217},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5171415209770203},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.5143817067146301},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4542830288410187},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.4497494697570801}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7301455736160278},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6117448806762695},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5936858654022217},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5171415209770203},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.5143817067146301},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4542830288410187},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.4497494697570801},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tase.2023.3337230","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2023.3337230","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6505405042","display_name":null,"funder_award_id":"U1864201","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W643528169","https://openalex.org/W1527702126","https://openalex.org/W1573205248","https://openalex.org/W1965455100","https://openalex.org/W2005071617","https://openalex.org/W2047688790","https://openalex.org/W2071969188","https://openalex.org/W2097645351","https://openalex.org/W2098955201","https://openalex.org/W2124298315","https://openalex.org/W2135956515","https://openalex.org/W2268044283","https://openalex.org/W2342840547","https://openalex.org/W2487175822","https://openalex.org/W2744369598","https://openalex.org/W2755552418","https://openalex.org/W2886622679","https://openalex.org/W2891385160","https://openalex.org/W2904814783","https://openalex.org/W2963165400","https://openalex.org/W2963787234","https://openalex.org/W3003329097","https://openalex.org/W3005781127","https://openalex.org/W3037606473","https://openalex.org/W3091165146","https://openalex.org/W3093456443","https://openalex.org/W3106187129","https://openalex.org/W3107293915","https://openalex.org/W3117223116","https://openalex.org/W3120649473","https://openalex.org/W3154384271","https://openalex.org/W3176912151","https://openalex.org/W3202432377","https://openalex.org/W4285047693","https://openalex.org/W4294292690","https://openalex.org/W4295046628","https://openalex.org/W4295248387","https://openalex.org/W4385268955","https://openalex.org/W6620991601","https://openalex.org/W6674884181","https://openalex.org/W6684338915","https://openalex.org/W6704559304","https://openalex.org/W6769297746","https://openalex.org/W6802142037"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W1941703695","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W2024136090","https://openalex.org/W3131574667","https://openalex.org/W2586732548","https://openalex.org/W4323768008"],"abstract_inverted_index":{"Human-like":[0],"autonomous":[1,217],"driving":[2,46,53,65,96,218,236,262,270],"can":[3,219],"enhance":[4,68,220],"user":[5,221],"acceptance":[6,222],"and":[7,207,223,337],"integration":[8,224],"within":[9,225],"traffic.":[10,226],"In":[11],"light":[12],"of":[13,94,155,247],"this,":[14],"this":[15,128,131,289],"paper":[16,132,228,290],"presents":[17],"a":[18,134,230,274,292],"planning":[19,182,231,312],"method":[20,42,187,232,253,317],"for":[21,71,101,233],"the":[22,40,57,69,73,91,105,149,159,171,181,185,195,198,203,252,255,303,311,315,325,328,333],"human-like":[23,234],"longitudinal":[24],"trajectory":[25],"in":[26,108,168],"car-following":[27,235],"scenarios":[28,116,279],"with":[29,127],"offline":[30,239],"sample-based":[31,240],"maximum":[32],"entropy":[33],"deep":[34,79,241],"inverse":[35,122,242,285],"reinforcement":[36,123,243,286],"learning":[37,124,244],"(DIRL).":[38,245],"Specifically,":[39],"proposed":[41,186,204,316,334],"doesn\u2019t":[43],"mimic":[44],"human":[45,74,191,249,321],"behavior":[47,193,323],"directly.":[48],"Instead,":[49],"it":[50,99],"uses":[51],"naturalistic":[52,95,269],"data":[54,97],"to":[55,63,82,103,125,158,170,190,214,260,301,320],"learn":[56],"internal":[58,256],"reward":[59,75,106,141,160,257,299],"function":[60,107,258],"that":[61,180,310],"leads":[62],"these":[64,261],"behaviors.":[66,263],"To":[67,264],"capacity":[70],"fitting":[72],"function,":[76],"DIRL":[77,102],"leverages":[78],"neural":[80],"networks":[81],"replace":[83],"linear":[84],"functions":[85],"used":[86],"by":[87,119,139,152,268,282,297],"traditional":[88,172],"IRL.":[89],"However,":[90],"long-tail":[92,272],"effect":[93],"makes":[98],"challenging":[100],"capture":[104],"edge":[109,115,278],"scenarios.":[110],"A":[111],"simulated":[112,275],"dataset":[113,276],"covering":[114,277],"is":[117,280],"collected":[118,281],"employing":[120,283],"feature-based":[121,284],"deal":[126],"challenge.":[129],"Furthermore,":[130],"trains":[133,291],"long-term":[135,144,293],"actor":[136,145,174,294],"network":[137,146,295,300],"guided":[138,296],"DIRL\u2019s":[140,298],"network.":[142,175],"The":[143,176,306],"significantly":[147],"reduces":[148],"computation":[150,304],"cost":[151],"three":[153],"orders":[154],"magnitude":[156],"compared":[157],"network-based":[161],"method,":[162],"while":[163],"also":[164],"avoiding":[165],"system":[166],"oscillation":[167],"contrast":[169],"one-step":[173],"simulation":[177,307],"experiments":[178,308],"confirm":[179,309],"results":[183,201,313,331],"from":[184,314],"are":[188,318],"closer":[189,319],"drivers\u2019":[192,322],"than":[194,324],"baseline.":[196,326],"And,":[197,327],"hardware-in-the-loop":[199,329],"experiment":[200,330],"affirm":[202,332],"method\u2019s":[205,335],"effectiveness":[206,336],"good":[208,338],"real-time":[209,339],"performance.":[210,340],"<italic":[211],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[212],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">Note":[213],"Practitioners</i>":[215],"\u2014Human-like":[216],"This":[227],"proposes":[229],"behaviors":[237],"using":[238],"Instead":[246],"mimicking":[248],"trajectories":[250],"directly,":[251],"learns":[254],"leading":[259],"address":[265],"challenges":[266],"posed":[267],"data\u2019s":[271],"effect,":[273],"learning.":[287],"Additionally,":[288],"reduce":[302],"cost.":[305]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5}],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
