{"id":"https://openalex.org/W4391305615","doi":"https://doi.org/10.1109/tase.2023.3347264","title":"Socially Intelligent Reinforcement Learning for Optimal Automated Vehicle Control in Traffic Scenarios","display_name":"Socially Intelligent Reinforcement Learning for Optimal Automated Vehicle Control in Traffic Scenarios","publication_year":2024,"publication_date":"2024-01-29","ids":{"openalex":"https://openalex.org/W4391305615","doi":"https://doi.org/10.1109/tase.2023.3347264"},"language":"en","primary_location":{"id":"doi:10.1109/tase.2023.3347264","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2023.3347264","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072145212","display_name":"Hamid Taghavifar","orcid":"https://orcid.org/0000-0002-2407-8393"},"institutions":[{"id":"https://openalex.org/I60158472","display_name":"Concordia University","ror":"https://ror.org/0420zvk78","country_code":"CA","type":"education","lineage":["https://openalex.org/I60158472"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Hamid Taghavifar","raw_affiliation_strings":["Department of Mechanical, Industrial and Aerospace Engineering, Concordia University, Montreal, QC, Canada","Department of Mechanical, Industrial and Aerospace Engineering, Concordia University, Montreal, Canada"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical, Industrial and Aerospace Engineering, Concordia University, Montreal, QC, Canada","institution_ids":["https://openalex.org/I60158472"]},{"raw_affiliation_string":"Department of Mechanical, Industrial and Aerospace Engineering, Concordia University, Montreal, Canada","institution_ids":["https://openalex.org/I60158472"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054213642","display_name":"Chongfeng Wei","orcid":"https://orcid.org/0000-0002-4565-509X"},"institutions":[{"id":"https://openalex.org/I126231945","display_name":"Queen's University Belfast","ror":"https://ror.org/00hswnk62","country_code":"GB","type":"education","lineage":["https://openalex.org/I126231945"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Chongfeng Wei","raw_affiliation_strings":["School of Mechanical and Aerospace Engineering, Queen&#x2019;s University Belfast, Belfast, U.K"],"affiliations":[{"raw_affiliation_string":"School of Mechanical and Aerospace Engineering, Queen&#x2019;s University Belfast, Belfast, U.K","institution_ids":["https://openalex.org/I126231945"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083976283","display_name":"Leyla Taghavifar","orcid":"https://orcid.org/0009-0004-5130-4781"},"institutions":[{"id":"https://openalex.org/I110525433","display_name":"Islamic Azad University, Tehran","ror":"https://ror.org/01kzn7k21","country_code":"IR","type":"education","lineage":["https://openalex.org/I110525433"]}],"countries":["IR"],"is_corresponding":false,"raw_author_name":"Leyla Taghavifar","raw_affiliation_strings":["School of Electrical and Electronics Engineering, Islamic Azad University (IAU), Tehran, Iran"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Electronics Engineering, Islamic Azad University (IAU), Tehran, Iran","institution_ids":["https://openalex.org/I110525433"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5072145212"],"corresponding_institution_ids":["https://openalex.org/I60158472"],"apc_list":null,"apc_paid":null,"fwci":7.2259,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.97600903,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"22","issue":null,"first_page":"129","last_page":"140"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9610000252723694,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9610000252723694,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7769703269004822},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.5442904829978943},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5126523375511169},{"id":"https://openalex.org/keywords/intelligent-transportation-system","display_name":"Intelligent transportation system","score":0.44385066628456116},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.4143292307853699},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4138481616973877},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.4118836522102356},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33884671330451965},{"id":"https://openalex.org/keywords/transport-engineering","display_name":"Transport engineering","score":0.3060630261898041}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7769703269004822},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.5442904829978943},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5126523375511169},{"id":"https://openalex.org/C47796450","wikidata":"https://www.wikidata.org/wiki/Q508378","display_name":"Intelligent transportation system","level":2,"score":0.44385066628456116},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.4143292307853699},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4138481616973877},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.4118836522102356},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33884671330451965},{"id":"https://openalex.org/C22212356","wikidata":"https://www.wikidata.org/wiki/Q775325","display_name":"Transport engineering","level":1,"score":0.3060630261898041},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tase.2023.3347264","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2023.3347264","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3825813119","display_name":null,"funder_award_id":"100010636","funder_id":"https://openalex.org/F4320334593","funder_display_name":"Natural Sciences and Engineering Research Council of Canada"}],"funders":[{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W2082585576","https://openalex.org/W2145339207","https://openalex.org/W2583993537","https://openalex.org/W2802205534","https://openalex.org/W2909906617","https://openalex.org/W2926065969","https://openalex.org/W2963135764","https://openalex.org/W3088333196","https://openalex.org/W3104608980","https://openalex.org/W3127561923","https://openalex.org/W3128640023","https://openalex.org/W3149568784","https://openalex.org/W3169261419","https://openalex.org/W3175299701","https://openalex.org/W3176187537","https://openalex.org/W3189363471","https://openalex.org/W3194730353","https://openalex.org/W3209247505","https://openalex.org/W4210405825","https://openalex.org/W4280556607","https://openalex.org/W4285049144","https://openalex.org/W4285240001","https://openalex.org/W4285489769","https://openalex.org/W4308068344","https://openalex.org/W4312235890","https://openalex.org/W4312570569","https://openalex.org/W4313645995","https://openalex.org/W4316193296","https://openalex.org/W4319835989","https://openalex.org/W4319997953","https://openalex.org/W4389266945","https://openalex.org/W6767604493"],"related_works":["https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2089013912","https://openalex.org/W2107890255","https://openalex.org/W2076061571","https://openalex.org/W2106552856","https://openalex.org/W1987513656","https://openalex.org/W2072376847"],"abstract_inverted_index":{"In":[0],"this":[1,247],"paper,":[2],"a":[3,18,21,25,32,65,90,99,187,274,299,354,377],"novel":[4,244],"approach":[5,125,346,381],"is":[6,69,102,164,199,278,347],"presented":[7],"for":[8,50,207,259],"modeling":[9],"the":[10,42,47,51,59,73,77,81,84,105,109,112,116,121,131,145,149,160,167,172,202,220,251,256,260,268,282,286,290,293,325,369,385],"interaction":[11],"dynamics":[12],"between":[13,93,136,302],"an":[14],"ego":[15,52,78,132,261,287],"car":[16,79,133,288],"and":[17,80,95,140,162,176,215,289,304,315,318,331,338,379,387],"bicycle":[19],"in":[20,104,159,186,210,349],"traffic":[22,217],"scenario":[23],"using":[24],"hybrid":[26],"reinforcement":[27],"learning":[28,117],"framework":[29,40,106,198,245,321],"combined":[30],"with":[31,183,236,360],"social":[33,74,146,283],"value":[34],"orientation":[35],"(SVO)":[36],"model.":[37],"The":[38,151,342],"proposed":[39,168,197],"leverages":[41],"SARSA":[43,252],"algorithm":[44,253],"to":[45,71,107,156,171,194,254,280,311,334,352],"learn":[46,255],"optimal":[48,257],"policy":[49,258],"vehicle":[53,262,329],"while":[54,143,263],"incorporating":[55,264],"risk":[56,265],"cost":[57,266],"as":[58,89,267,298],"negative":[60,269],"log-likelihood":[61,270],"of":[62,76,86,111,123,148,174,205,223,271,285,295,327,344,356,371,390],"collision.":[63,272],"Additionally,":[64,273],"customized":[66,275],"SVO":[67,85,113,276,294],"model":[68,114,277],"introduced":[70,279],"capture":[72,281],"preferences":[75,147,284],"bicycle,":[82,291],"defining":[83,292],"each":[87,296],"agent":[88,297],"continuous":[91,300],"variable":[92,301],"egoistic":[94,303],"cooperative":[96,305],"orientations.":[97,306],"Furthermore,":[98],"weight":[100],"parameter":[101],"incorporated":[103],"regulate":[108],"influence":[110],"on":[115,226],"process.":[118],"We":[119],"demonstrate":[120],"effectiveness":[122],"our":[124,345,374],"through":[126],"extensive":[127],"simulations,":[128],"showing":[129],"that":[130,166,181,232,382],"can":[134,233,322,383],"balance":[135],"maximizing":[137],"its":[138,350],"reward":[139],"avoiding":[141],"collisions":[142],"considering":[144],"agents.":[150],"obtained":[152],"results":[153],"are":[154],"compared":[155],"other":[157,237],"models":[158],"literature,":[161],"it":[163],"shown":[165],"method":[169],"contributes":[170],"development":[173],"safe":[175],"efficient":[177],"autonomous":[178,208,224,309,328,357],"driving":[179,213,392],"systems":[180,231],"interact":[182,235],"human-driven":[184],"vehicles":[185,225,310,358],"socially":[188],"intelligent":[189,229],"manner":[190],"<italic":[191],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[192],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">Note":[193],"Practitioners</i>":[195],"\u2014This":[196],"motivated":[200],"by":[201,249],"pressing":[203],"challenge":[204],"navigation":[206,230,330],"cars":[209],"complex":[211],"urban":[212,391],"scenarios":[214],"mixed":[216],"situations.":[218],"With":[219],"increasing":[221],"prevalence":[222],"roads,":[227],"developing":[228,335],"effectively":[234],"road":[238,362],"users":[239],"has":[240],"become":[241],"essential.":[242],"Our":[243,320],"addresses":[246],"need":[248],"leveraging":[250,368],"This":[307],"enables":[308],"make":[312],"informed":[313],"decisions":[314],"navigate":[316],"safely":[317],"efficiently.":[319],"enormously":[323],"help":[324],"field":[326],"contribute":[332],"significantly":[333],"safe,":[336],"human-centric,":[337],"reliable":[339],"transportation":[340],"systems.":[341],"versatility":[343],"evident":[348],"potential":[351],"support":[353],"network":[355],"interacting":[359],"multiple":[361],"users,":[363],"thereby":[364],"enhancing":[365],"scalability.":[366],"By":[367],"power":[370],"machine":[372],"learning,":[373],"solution":[375],"provides":[376],"robust":[378],"adaptable":[380],"handle":[384],"diverse":[386],"ever-changing":[388],"conditions":[389],"scenarios.":[393]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":10}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
