{"id":"https://openalex.org/W4405429419","doi":"https://doi.org/10.1109/lra.2024.3518839","title":"Distributional Reinforcement Learning Based Integrated Decision Making and Control for Autonomous Surface Vehicles","display_name":"Distributional Reinforcement Learning Based Integrated Decision Making and Control for Autonomous Surface Vehicles","publication_year":2024,"publication_date":"2024-12-16","ids":{"openalex":"https://openalex.org/W4405429419","doi":"https://doi.org/10.1109/lra.2024.3518839"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2024.3518839","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2024.3518839","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100450524","display_name":"Lin Xi","orcid":"https://orcid.org/0000-0003-0118-7391"},"institutions":[{"id":"https://openalex.org/I108468826","display_name":"Stevens Institute of Technology","ror":"https://ror.org/02z43xh36","country_code":"US","type":"education","lineage":["https://openalex.org/I108468826"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xi Lin","raw_affiliation_strings":["Department of Mechanical Engineering, Stevens Institute of Technology, Hoboken, NJ, USA"],"raw_orcid":"https://orcid.org/0000-0003-0118-7391","affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, Stevens Institute of Technology, Hoboken, NJ, USA","institution_ids":["https://openalex.org/I108468826"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060201714","display_name":"Paul Szenher","orcid":"https://orcid.org/0009-0009-3835-5433"},"institutions":[{"id":"https://openalex.org/I108468826","display_name":"Stevens Institute of Technology","ror":"https://ror.org/02z43xh36","country_code":"US","type":"education","lineage":["https://openalex.org/I108468826"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Paul Szenher","raw_affiliation_strings":["Department of Mechanical Engineering, Stevens Institute of Technology, Hoboken, NJ, USA"],"raw_orcid":"https://orcid.org/0009-0009-3835-5433","affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, Stevens Institute of Technology, Hoboken, NJ, USA","institution_ids":["https://openalex.org/I108468826"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016931059","display_name":"Yewei Huang","orcid":"https://orcid.org/0000-0002-2505-6022"},"institutions":[{"id":"https://openalex.org/I108468826","display_name":"Stevens Institute of Technology","ror":"https://ror.org/02z43xh36","country_code":"US","type":"education","lineage":["https://openalex.org/I108468826"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yewei Huang","raw_affiliation_strings":["Department of Mechanical Engineering, Stevens Institute of Technology, Hoboken, NJ, USA"],"raw_orcid":"https://orcid.org/0000-0002-2505-6022","affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, Stevens Institute of Technology, Hoboken, NJ, USA","institution_ids":["https://openalex.org/I108468826"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044251670","display_name":"Brendan Englot","orcid":"https://orcid.org/0000-0002-7966-2917"},"institutions":[{"id":"https://openalex.org/I108468826","display_name":"Stevens Institute of Technology","ror":"https://ror.org/02z43xh36","country_code":"US","type":"education","lineage":["https://openalex.org/I108468826"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Brendan Englot","raw_affiliation_strings":["Department of Mechanical Engineering, Stevens Institute of Technology, Hoboken, NJ, USA"],"raw_orcid":"https://orcid.org/0000-0002-7966-2917","affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, Stevens Institute of Technology, Hoboken, NJ, USA","institution_ids":["https://openalex.org/I108468826"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.4565,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.830056,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"10","issue":"2","first_page":"1194","last_page":"1201"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14011","display_name":"Elevator Systems and Control","score":0.6115999817848206,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14011","display_name":"Elevator Systems and Control","score":0.6115999817848206,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.5508999824523926,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.5454999804496765,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8203480243682861},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.5609405040740967},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.5213607549667358},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5027801990509033},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37555328011512756},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.28945839405059814}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8203480243682861},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.5609405040740967},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5213607549667358},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5027801990509033},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37555328011512756},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.28945839405059814},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2024.3518839","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2024.3518839","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6899999976158142,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G6550789113","display_name":null,"funder_award_id":"N00014-24-1-2522","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G8534626878","display_name":null,"funder_award_id":"N00014-20-1-2570","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"}],"funders":[{"id":"https://openalex.org/F4320337345","display_name":"Office of Naval Research","ror":"https://ror.org/00rk2pe57"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W2074547849","https://openalex.org/W2145339207","https://openalex.org/W2492811885","https://openalex.org/W2547705816","https://openalex.org/W2565029242","https://openalex.org/W2761873684","https://openalex.org/W2790472381","https://openalex.org/W2891998162","https://openalex.org/W2954211265","https://openalex.org/W2973229164","https://openalex.org/W2979089101","https://openalex.org/W3001711064","https://openalex.org/W3015082424","https://openalex.org/W3019349330","https://openalex.org/W3083914918","https://openalex.org/W3094040002","https://openalex.org/W3128019105","https://openalex.org/W3174645049","https://openalex.org/W3215237054","https://openalex.org/W3217527643","https://openalex.org/W4303712354","https://openalex.org/W4312268189","https://openalex.org/W4322729780","https://openalex.org/W4393404806","https://openalex.org/W4401417420","https://openalex.org/W6683300800","https://openalex.org/W6747473740","https://openalex.org/W6750645735","https://openalex.org/W6751629939","https://openalex.org/W6773161478","https://openalex.org/W6798240405"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W2920061524","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856"],"abstract_inverted_index":{"With":[0],"the":[1,12,28,65,68,112,135],"growing":[2],"demands":[3],"for":[4,18,36,71],"Autonomous":[5],"Surface":[6],"Vehicles":[7],"(ASVs)":[8],"in":[9,27,43,63,105,115,141],"recent":[10],"years,":[11],"number":[13],"of":[14,111],"ASVs":[15,37],"being":[16],"deployed":[17],"various":[19],"maritime":[20],"missions":[21],"is":[22,33],"expected":[23],"to":[24,38,100,122,125,147],"increase":[25],"rapidly":[26],"near":[29,58],"future.":[30],"However,":[31],"it":[32],"still":[34],"challenging":[35],"perform":[39],"sensor-based":[40],"autonomous":[41],"navigation":[42,89,142],"obstacle-filled":[44],"and":[45,54,97,144,155],"congested":[46],"waterways,":[47],"where":[48],"perception":[49],"errors,":[50],"closely":[51],"gathered":[52],"vehicles":[53],"limited":[55],"maneuvering":[56],"space":[57],"buoys":[59],"may":[60],"cause":[61],"difficulties":[62],"following":[64],"Convention":[66],"on":[67,134],"International":[69],"Regulations":[70],"Preventing":[72],"Collisions":[73],"at":[74],"Sea":[75],"(COLREGs).":[76],"To":[77],"address":[78],"these":[79],"issues,":[80],"we":[81],"propose":[82],"a":[83],"novel":[84],"Distributional":[85,151],"Reinforcement":[86],"Learning":[87],"based":[88,133],"system":[90,114],"that":[91],"can":[92],"work":[93],"with":[94],"onboard":[95],"LiDAR":[96],"odometry":[98],"sensors":[99],"generate":[101],"arbitrary":[102],"thrust":[103],"commands":[104],"continuous":[106],"action":[107],"space.":[108],"Comprehensive":[109],"evaluations":[110],"proposed":[113],"high-fidelity":[116],"Gazebo":[117],"simulations":[118],"show":[119],"its":[120],"ability":[121],"decide":[123],"whether":[124],"follow":[126],"COLREGs":[127],"or":[128],"take":[129],"other":[130],"beneficial":[131],"actions":[132],"scenarios":[136],"encountered,":[137],"offering":[138],"superior":[139],"performance":[140],"safety":[143],"efficiency":[145],"compared":[146],"systems":[148],"using":[149],"state-of-the-art":[150],"RL,":[152],"non-Distributional":[153],"RL":[154],"classical":[156],"methods.":[157]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
