{"id":"https://openalex.org/W4416944577","doi":"https://doi.org/10.48550/arxiv.2511.22338","title":"Nonholonomic Narrow Dead-End Escape with Deep Reinforcement Learning","display_name":"Nonholonomic Narrow Dead-End Escape with Deep Reinforcement Learning","publication_year":2025,"publication_date":"2025-11-27","ids":{"openalex":"https://openalex.org/W4416944577","doi":"https://doi.org/10.48550/arxiv.2511.22338"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2511.22338","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.22338","pdf_url":"https://arxiv.org/pdf/2511.22338","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2511.22338","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101431184","display_name":"Dan Xiong","orcid":"https://orcid.org/0000-0001-7441-8336"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Xiong, Denghan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003158162","display_name":"Yingjie Zhao","orcid":"https://orcid.org/0009-0000-8336-275X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Yanzhe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100415363","display_name":"Yutong Chen","orcid":"https://orcid.org/0000-0002-3033-4138"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yutong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5002363712","display_name":"Zichun Wang","orcid":"https://orcid.org/0009-0009-2752-7260"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zichun","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101431184"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.8788999915122986,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.8788999915122986,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.023099999874830246,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11615","display_name":"Control and Dynamics of Mobile Robots","score":0.020899999886751175,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ackermann-function","display_name":"Ackermann function","score":0.8356999754905701},{"id":"https://openalex.org/keywords/nonholonomic-system","display_name":"Nonholonomic system","score":0.7717000246047974},{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.6646999716758728},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.569100022315979},{"id":"https://openalex.org/keywords/underactuation","display_name":"Underactuation","score":0.5062999725341797},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.5015000104904175},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.48910000920295715},{"id":"https://openalex.org/keywords/reachability","display_name":"Reachability","score":0.42910000681877136},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.4115999937057495}],"concepts":[{"id":"https://openalex.org/C33436860","wikidata":"https://www.wikidata.org/wiki/Q341835","display_name":"Ackermann function","level":3,"score":0.8356999754905701},{"id":"https://openalex.org/C138632511","wikidata":"https://www.wikidata.org/wiki/Q2478109","display_name":"Nonholonomic system","level":4,"score":0.7717000246047974},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.6646999716758728},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.569100022315979},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5683000087738037},{"id":"https://openalex.org/C88337583","wikidata":"https://www.wikidata.org/wiki/Q7883433","display_name":"Underactuation","level":3,"score":0.5062999725341797},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.5015000104904175},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.48910000920295715},{"id":"https://openalex.org/C136643341","wikidata":"https://www.wikidata.org/wiki/Q1361526","display_name":"Reachability","level":2,"score":0.42910000681877136},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.4115999937057495},{"id":"https://openalex.org/C165464430","wikidata":"https://www.wikidata.org/wiki/Q1570441","display_name":"Parameterized complexity","level":2,"score":0.4025999903678894},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.38830000162124634},{"id":"https://openalex.org/C21200559","wikidata":"https://www.wikidata.org/wiki/Q7451068","display_name":"Sensitivity (control systems)","level":2,"score":0.3765000104904175},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.3765000104904175},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.37450000643730164},{"id":"https://openalex.org/C74222875","wikidata":"https://www.wikidata.org/wiki/Q16000312","display_name":"Robot kinematics","level":4,"score":0.33820000290870667},{"id":"https://openalex.org/C195065555","wikidata":"https://www.wikidata.org/wiki/Q214881","display_name":"Curvature","level":2,"score":0.33239999413490295},{"id":"https://openalex.org/C79487989","wikidata":"https://www.wikidata.org/wiki/Q934680","display_name":"Vehicle dynamics","level":2,"score":0.3310999870300293},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.3190000057220459},{"id":"https://openalex.org/C176809094","wikidata":"https://www.wikidata.org/wiki/Q15401496","display_name":"Traverse","level":2,"score":0.3149999976158142},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3000999987125397},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.2888000011444092},{"id":"https://openalex.org/C197115733","wikidata":"https://www.wikidata.org/wiki/Q1003136","display_name":"Forcing (mathematics)","level":2,"score":0.2888000011444092},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.28220000863075256},{"id":"https://openalex.org/C17816587","wikidata":"https://www.wikidata.org/wiki/Q1501872","display_name":"Inverse kinematics","level":3,"score":0.2773999869823456},{"id":"https://openalex.org/C58315980","wikidata":"https://www.wikidata.org/wiki/Q179436","display_name":"Asymptote","level":2,"score":0.27219998836517334},{"id":"https://openalex.org/C2776937971","wikidata":"https://www.wikidata.org/wiki/Q4384217","display_name":"Heading (navigation)","level":2,"score":0.2565999925136566}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2511.22338","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.22338","pdf_url":"https://arxiv.org/pdf/2511.22338","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2511.22338","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.22338","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2511.22338","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.22338","pdf_url":"https://arxiv.org/pdf/2511.22338","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Nonholonomic":[0],"constraints":[1,137],"restrict":[2],"feasible":[3,126],"velocities":[4],"without":[5],"reducing":[6],"configuration-space":[7],"dimension,":[8],"which":[9,71],"makes":[10],"collision-free":[11],"geometric":[12],"paths":[13],"generally":[14],"non-executable":[15],"for":[16,86],"car-like":[17],"robots.":[18],"Ackermann":[19,87,105],"steering":[20,51],"further":[21],"imposes":[22],"curvature":[23],"bounds":[24],"and":[25,40,49,62,75,89,107,138,177,182,190],"forbids":[26],"in-place":[27],"rotation,":[28],"so":[29],"escaping":[30],"from":[31],"narrow":[32,57,83,115],"dead":[33,116],"ends":[34,117],"typically":[35],"requires":[36],"tightly":[37],"sequenced":[38],"forward":[39],"reverse":[41],"maneuvers.":[42],"Classical":[43],"planners":[44,153],"that":[45,98,118,134,154],"decouple":[46],"global":[47,156],"search":[48,157],"local":[50],"struggle":[52],"in":[53],"these":[54],"settings":[55],"because":[56],"passages":[58],"occupy":[59],"low-measure":[60],"regions":[61],"nonholonomic":[63,82,159],"reachability":[64],"shrinks":[65],"the":[66,143,165,187],"set":[67],"of":[68,114,172],"valid":[69],"connections,":[70],"degrades":[72],"sampling":[73],"efficiency":[74],"increases":[76],"sensitivity":[77],"to":[78,111,121],"clearances.":[79],"We":[80,193],"study":[81],"dead-end":[84,163],"escape":[85],"vehicles":[88],"contribute":[90],"three":[91],"components.":[92],"First,":[93],"we":[94,129,148],"construct":[95,130],"a":[96,131,140,169],"generator":[97],"samples":[99],"multi-phase":[100],"forward-reverse":[101],"trajectories":[102],"compatible":[103],"with":[104,158],"kinematics":[106],"inflates":[108],"their":[109],"envelopes":[110],"synthesize":[112],"families":[113],"are":[119],"guaranteed":[120],"admit":[122],"at":[123,200],"least":[124],"one":[125],"escape.":[127],"Second,":[128],"training":[132],"environment":[133],"enforces":[135],"kinematic":[136],"train":[139],"policy":[141,167],"using":[142],"soft":[144],"actor-critic":[145],"algorithm.":[146],"Third,":[147],"evaluate":[149],"against":[150],"representative":[151],"classical":[152],"combine":[155],"steering.":[160],"Across":[161],"parameterized":[162],"families,":[164],"learned":[166],"solves":[168],"larger":[170],"fraction":[171],"instances,":[173],"reduces":[174],"maneuver":[175],"count,":[176],"maintains":[178],"comparable":[179],"path":[180],"length":[181],"planning":[183],"time":[184],"while":[185],"under":[186],"same":[188],"sensing":[189],"control":[191],"limits.":[192],"provide":[194],"our":[195],"project":[196],"as":[197],"open":[198],"source":[199],"https://github.com/gitagitty/cisDRL-RobotNav.git":[201]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-12-03T00:00:00"}
