{"id":"https://openalex.org/W7139022155","doi":"https://doi.org/10.1145/3788149.3788204","title":"Nonholonomic Narrow Dead-End Escape with Deep Reinforcement Learning","display_name":"Nonholonomic Narrow Dead-End Escape with Deep Reinforcement Learning","publication_year":2025,"publication_date":"2025-12-12","ids":{"openalex":"https://openalex.org/W7139022155","doi":"https://doi.org/10.1145/3788149.3788204"},"language":null,"primary_location":{"id":"doi:10.1145/3788149.3788204","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3788149.3788204","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 9th International Conference on Computer Science and Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3788149.3788204","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Denghan Xiong","orcid":"https://orcid.org/0009-0003-0657-1787"},"institutions":[{"id":"https://openalex.org/I4210092870","display_name":"Jiaxing University","ror":"https://ror.org/00j2a7k55","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210092870"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Denghan Xiong","raw_affiliation_strings":["Zhejiang University, Jiaxing, Zhejiang, China"],"raw_orcid":"https://orcid.org/0009-0003-0657-1787","affiliations":[{"raw_affiliation_string":"Zhejiang University, Jiaxing, Zhejiang, China","institution_ids":["https://openalex.org/I4210092870"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yanzhe Zhao","orcid":"https://orcid.org/0009-0003-5342-6611"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanzhe Zhao","raw_affiliation_strings":["Tianjin University, Tianjin, Tianjin, China"],"raw_orcid":"https://orcid.org/0009-0003-5342-6611","affiliations":[{"raw_affiliation_string":"Tianjin University, Tianjin, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yutong Chen","orcid":"https://orcid.org/0009-0004-9202-1673"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yutong Chen","raw_affiliation_strings":["Beijing Jiao Tong University, Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0004-9202-1673","affiliations":[{"raw_affiliation_string":"Beijing Jiao Tong University, Beijing, Beijing, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5129856448","display_name":"Zichun Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I13591777","display_name":"University of Nottingham Ningbo China","ror":"https://ror.org/03y4dt428","country_code":"CN","type":"education","lineage":["https://openalex.org/I13591777","https://openalex.org/I142263535"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zichun Wang","raw_affiliation_strings":["University of Nottingham Ningbo China, Ningbo, Zhejiang, China"],"raw_orcid":"https://orcid.org/0009-0005-7596-1353","affiliations":[{"raw_affiliation_string":"University of Nottingham Ningbo China, Ningbo, Zhejiang, China","institution_ids":["https://openalex.org/I13591777"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I4210092870"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.70890076,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"126","last_page":"131"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11615","display_name":"Control and Dynamics of Mobile Robots","score":0.5806999802589417,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11615","display_name":"Control and Dynamics of Mobile Robots","score":0.5806999802589417,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.13490000367164612,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12158","display_name":"Guidance and Control Systems","score":0.037700001150369644,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.5705999732017517},{"id":"https://openalex.org/keywords/nonholonomic-system","display_name":"Nonholonomic system","score":0.41589999198913574},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.3425999879837036},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.3334999978542328},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.3190999925136566},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.30320000648498535}],"concepts":[{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.5705999732017517},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5077999830245972},{"id":"https://openalex.org/C138632511","wikidata":"https://www.wikidata.org/wiki/Q2478109","display_name":"Nonholonomic system","level":4,"score":0.41589999198913574},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35910001397132874},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.3425999879837036},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.3334999978542328},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.3190999925136566},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.30320000648498535},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.2944999933242798},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2930000126361847},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.29170000553131104},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.28200000524520874},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2759000062942505},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.25839999318122864}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3788149.3788204","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3788149.3788204","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 9th International Conference on Computer Science and Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3788149.3788204","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3788149.3788204","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 9th International Conference on Computer Science and Artificial Intelligence","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.4616279900074005}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W1633338931","https://openalex.org/W1969483458","https://openalex.org/W1971998222","https://openalex.org/W2122724557","https://openalex.org/W2148970883","https://openalex.org/W2963428623","https://openalex.org/W3158253560","https://openalex.org/W3203686546","https://openalex.org/W3206426202","https://openalex.org/W3208979922","https://openalex.org/W4284714030","https://openalex.org/W4285685133","https://openalex.org/W4327522515","https://openalex.org/W4387880310","https://openalex.org/W4416083998","https://openalex.org/W4417050645"],"related_works":[],"abstract_inverted_index":{"Nonholonomic":[0],"constraints":[1,137],"restrict":[2],"feasible":[3,126],"velocities":[4],"without":[5],"reducing":[6],"configuration-space":[7],"dimension,":[8],"which":[9,71],"makes":[10],"collision-free":[11],"geometric":[12],"paths":[13],"generally":[14],"non-executable":[15],"for":[16,86],"car-like":[17],"robots.":[18],"Ackermann":[19,87,105],"steering":[20,51],"further":[21],"imposes":[22],"curvature":[23],"bounds":[24],"and":[25,40,49,62,75,89,107,138,177,182,190],"forbids":[26],"in-place":[27],"rotation,":[28],"so":[29],"escaping":[30],"from":[31],"narrow":[32,57,83,115],"dead":[33,116],"ends":[34,117],"typically":[35],"requires":[36],"tightly":[37],"sequenced":[38],"forward":[39],"reverse":[41],"maneuvers.":[42],"Classical":[43],"planners":[44,153],"that":[45,98,118,134,154],"decouple":[46],"global":[47,156],"search":[48,157],"local":[50],"struggle":[52],"in":[53],"these":[54],"settings":[55],"because":[56],"passages":[58],"occupy":[59],"low-measure":[60],"regions":[61],"nonholonomic":[63,82,159],"reachability":[64],"shrinks":[65],"the":[66,143,165,187],"set":[67],"of":[68,114,172],"valid":[69],"connections,":[70],"degrades":[72],"sampling":[73],"efficiency":[74],"increases":[76],"sensitivity":[77],"to":[78,111,121],"clearances.":[79],"We":[80,193],"study":[81],"dead-end":[84,163],"escape":[85],"vehicles":[88],"contribute":[90],"three":[91],"components.":[92],"First,":[93],"we":[94,129,148],"construct":[95,130],"a":[96,131,140,169],"generator":[97],"samples":[99],"multi-phase":[100],"forward\u2013reverse":[101],"trajectories":[102],"compatible":[103],"with":[104,158],"kinematics":[106],"inflates":[108],"their":[109],"envelopes":[110],"synthesize":[112],"families":[113],"are":[119],"guaranteed":[120],"admit":[122],"at":[123],"least":[124],"one":[125],"escape.":[127],"Second,":[128],"training":[132],"environment":[133],"enforces":[135],"kinematic":[136],"train":[139],"policy":[141,167],"using":[142],"soft":[144],"actor-critic":[145],"algorithm.":[146],"Third,":[147],"evaluate":[149],"against":[150],"representative":[151],"classical":[152],"combine":[155],"steering.":[160],"Across":[161],"parameterized":[162],"families,":[164],"learned":[166],"solves":[168],"larger":[170],"fraction":[171],"instances,":[173],"reduces":[174],"maneuver":[175],"count,":[176],"maintains":[178],"comparable":[179],"path":[180],"length":[181],"planning":[183],"time":[184],"while":[185],"under":[186],"same":[188],"sensing":[189],"control":[191],"limits.":[192],"provide":[194],"our":[195],"project":[196],"as":[197],"an":[198],"open":[199],"source":[200],"on":[201],"https://github.com/gitagitty/cisDRL-RobotNav.git":[202]},"counts_by_year":[],"updated_date":"2026-03-21T06:30:42.041108","created_date":"2026-03-20T00:00:00"}
