{"id":"https://openalex.org/W4391768774","doi":"https://doi.org/10.1109/itsc57777.2023.10422486","title":"Temporal Based Deep Reinforcement Learning for Crowded Lane Merging Maneuvers","display_name":"Temporal Based Deep Reinforcement Learning for Crowded Lane Merging Maneuvers","publication_year":2023,"publication_date":"2023-09-24","ids":{"openalex":"https://openalex.org/W4391768774","doi":"https://doi.org/10.1109/itsc57777.2023.10422486"},"language":"en","primary_location":{"id":"doi:10.1109/itsc57777.2023.10422486","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/itsc57777.2023.10422486","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 26th International Conference on Intelligent Transportation Systems (ITSC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111128670","display_name":"Luis Miguel Mart\u00ednez G\u00f3mez","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Luis Miguel Mart\u00ednez G\u00f3mez","raw_affiliation_strings":["University of Alcal&#x00E1;,Computer Engineering Department,Spain,28805"],"affiliations":[{"raw_affiliation_string":"University of Alcal&#x00E1;,Computer Engineering Department,Spain,28805","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051151484","display_name":"Iv\u00e1n Garc\u00eda Daza","orcid":"https://orcid.org/0000-0001-8940-6434"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Iv\u00e1n Garc\u00eda Daza","raw_affiliation_strings":["University of Alcal&#x00E1;,Computer Engineering Department,Spain,28805"],"affiliations":[{"raw_affiliation_string":"University of Alcal&#x00E1;,Computer Engineering Department,Spain,28805","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048485743","display_name":"Miguel A. V\u00e1zquez","orcid":"https://orcid.org/0009-0003-5435-8323"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Miguel \u00c1ngel Sotelo V\u00e1zquez","raw_affiliation_strings":["University of Alcal&#x00E1;,Computer Engineering Department,Spain,28805"],"affiliations":[{"raw_affiliation_string":"University of Alcal&#x00E1;,Computer Engineering Department,Spain,28805","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5111128670"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.25854181,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"abs/1610.03295","issue":null,"first_page":"2764","last_page":"2769"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10805","display_name":"Vehicle Dynamics and Control Systems","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8130625486373901},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7547863125801086},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5932190418243408},{"id":"https://openalex.org/keywords/temporal-difference-learning","display_name":"Temporal difference learning","score":0.41035011410713196},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.38097262382507324}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8130625486373901},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7547863125801086},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5932190418243408},{"id":"https://openalex.org/C196340769","wikidata":"https://www.wikidata.org/wiki/Q7698910","display_name":"Temporal difference learning","level":3,"score":0.41035011410713196},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.38097262382507324}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/itsc57777.2023.10422486","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/itsc57777.2023.10422486","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 26th International Conference on Intelligent Transportation Systems (ITSC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1977565586","https://openalex.org/W2103328396","https://openalex.org/W2583993537","https://openalex.org/W2736601468","https://openalex.org/W2794786585","https://openalex.org/W2919912236","https://openalex.org/W2962977206","https://openalex.org/W2963322416","https://openalex.org/W2963625099","https://openalex.org/W2989730386","https://openalex.org/W3100944043","https://openalex.org/W3120624913","https://openalex.org/W3176912151","https://openalex.org/W3208191353","https://openalex.org/W4286253093","https://openalex.org/W4301501993","https://openalex.org/W6728155968","https://openalex.org/W6741002519","https://openalex.org/W6745935785","https://openalex.org/W6747473740","https://openalex.org/W6748839928","https://openalex.org/W6749650931","https://openalex.org/W6793108136","https://openalex.org/W6804601995"],"related_works":["https://openalex.org/W2755342338","https://openalex.org/W2058170566","https://openalex.org/W2036807459","https://openalex.org/W2772917594","https://openalex.org/W2775347418","https://openalex.org/W1969923398","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2079911747"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3],"propose":[4],"a":[5,23,38,65,98,139],"joint":[6],"behavior":[7,79],"and":[8,45,104,115,143],"motion":[9],"planning":[10],"agent":[11,28,57,91,137],"based":[12],"on":[13],"DRL":[14],"(Deep":[15],"Reinforcement":[16],"Learning)":[17],"intended":[18],"for":[19],"automated":[20],"vehicles":[21,83],"in":[22,52,84,88,110],"crowded":[24],"merging":[25,94],"scenario.":[26],"The":[27],"is":[29],"trained":[30],"using":[31,68],"the":[32,53,69,78,85,90,93,127,145,152],"PPO":[33],"(Proximal":[34],"Policy":[35],"Optimization)":[36],"algorithm,":[37],"state-of-the-art":[39],"solution":[40],"that":[41,134],"ensures":[42],"training":[43],"stability":[44],"sample":[46],"efficiency.":[47],"We":[48,62,96,117],"include":[49],"temporal":[50,102],"information":[51],"observation":[54],"of":[55,80,112,122,147],"our":[56,101,135],"to":[58,73,125],"improve":[59],"system":[60],"stability.":[61],"have":[63],"defined":[64],"simulated":[66,86],"environment":[67],"CARLA":[70],"(Car":[71],"Learning":[72],"Act)":[74],"simulator,":[75],"which":[76,89],"handles":[77],"all":[81],"other":[82],"world,":[87],"performs":[92],"maneuver.":[95],"perform":[97],"comparison":[99],"between":[100,130],"approach":[103],"an":[105],"established,":[106],"distance-based":[107],"one,":[108],"both":[109,123,149],"terms":[111],"safety,":[113],"smoothness":[114],"comfort.":[116],"further":[118],"analyze":[119],"specific":[120],"examples":[121],"systems":[124,150],"describe":[126],"performance":[128],"differences":[129],"them.":[131],"Results":[132],"show":[133],"proposed":[136],"yields":[138],"smoother,":[140],"safer":[141],"experience,":[142],"prove":[144],"viability":[146],"interweaving":[148],"within":[151],"same":[153],"agent.":[154]},"counts_by_year":[],"updated_date":"2025-12-25T23:11:45.687758","created_date":"2025-10-10T00:00:00"}
