{"id":"https://openalex.org/W4417297073","doi":"https://doi.org/10.48550/arxiv.2512.10934","title":"Curriculum-Based Reinforcement Learning for Autonomous UAV Navigation in Unknown Curved Tubular Conduit","display_name":"Curriculum-Based Reinforcement Learning for Autonomous UAV Navigation in Unknown Curved Tubular Conduit","publication_year":2025,"publication_date":"2025-12-11","ids":{"openalex":"https://openalex.org/W4417297073","doi":"https://doi.org/10.48550/arxiv.2512.10934"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2512.10934","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.10934","pdf_url":"https://arxiv.org/pdf/2512.10934","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2512.10934","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067484998","display_name":"Zamirddine Mari","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Mari, Zamirddine","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108113352","display_name":"J\u00e9r\u00f4me Pasquet","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pasquet, J\u00e9r\u00f4me","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5045275862","display_name":"Julien Seinturier","orcid":"https://orcid.org/0000-0002-8996-6287"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Seinturier, Julien","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5067484998"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.5831000208854675,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.5831000208854675,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.1599999964237213,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.0340999998152256,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/drone","display_name":"Drone","score":0.7339000105857849},{"id":"https://openalex.org/keywords/observability","display_name":"Observability","score":0.7296000123023987},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6205000281333923},{"id":"https://openalex.org/keywords/lidar","display_name":"Lidar","score":0.5726000070571899},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.5508999824523926},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.5507000088691711},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.40299999713897705},{"id":"https://openalex.org/keywords/obstacle-avoidance","display_name":"Obstacle avoidance","score":0.3799000084400177},{"id":"https://openalex.org/keywords/course","display_name":"Course (navigation)","score":0.3783999979496002}],"concepts":[{"id":"https://openalex.org/C59519942","wikidata":"https://www.wikidata.org/wiki/Q650665","display_name":"Drone","level":2,"score":0.7339000105857849},{"id":"https://openalex.org/C36299963","wikidata":"https://www.wikidata.org/wiki/Q1369844","display_name":"Observability","level":2,"score":0.7296000123023987},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6205000281333923},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6080999970436096},{"id":"https://openalex.org/C51399673","wikidata":"https://www.wikidata.org/wiki/Q504027","display_name":"Lidar","level":2,"score":0.5726000070571899},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5627999901771545},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.5508999824523926},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.5507000088691711},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.521399974822998},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.40299999713897705},{"id":"https://openalex.org/C6683253","wikidata":"https://www.wikidata.org/wiki/Q7075535","display_name":"Obstacle avoidance","level":4,"score":0.3799000084400177},{"id":"https://openalex.org/C2777552389","wikidata":"https://www.wikidata.org/wiki/Q1962728","display_name":"Course (navigation)","level":2,"score":0.3783999979496002},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.35600000619888306},{"id":"https://openalex.org/C61272859","wikidata":"https://www.wikidata.org/wiki/Q7834031","display_name":"Transferability","level":3,"score":0.3490000069141388},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.34540000557899475},{"id":"https://openalex.org/C184297639","wikidata":"https://www.wikidata.org/wiki/Q177765","display_name":"Biometrics","level":2,"score":0.33649998903274536},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3246000111103058},{"id":"https://openalex.org/C2778361833","wikidata":"https://www.wikidata.org/wiki/Q34735","display_name":"Compass","level":2,"score":0.31709998846054077},{"id":"https://openalex.org/C2776010242","wikidata":"https://www.wikidata.org/wiki/Q4677575","display_name":"Active perception","level":3,"score":0.2996000051498413},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2989000082015991},{"id":"https://openalex.org/C198352243","wikidata":"https://www.wikidata.org/wiki/Q37105","display_name":"Line (geometry)","level":2,"score":0.29739999771118164},{"id":"https://openalex.org/C9770341","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Geospatial analysis","level":2,"score":0.29420000314712524},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.28600001335144043},{"id":"https://openalex.org/C2777891301","wikidata":"https://www.wikidata.org/wiki/Q3475123","display_name":"Navigation system","level":2,"score":0.2849999964237213},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.27570000290870667},{"id":"https://openalex.org/C13687954","wikidata":"https://www.wikidata.org/wiki/Q4826847","display_name":"Autonomous agent","level":2,"score":0.27410000562667847},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2655999958515167},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.26100000739097595},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2574000060558319},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.2558000087738037},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.2531999945640564}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2512.10934","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.10934","pdf_url":"https://arxiv.org/pdf/2512.10934","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2512.10934","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.10934","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2512.10934","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.10934","pdf_url":"https://arxiv.org/pdf/2512.10934","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Autonomous":[0],"drone":[1,40],"navigation":[2,156,214],"in":[3,186,215],"confined":[4],"tubular":[5,217],"environments":[6,218],"remains":[7],"a":[8,34,39,61,77,104,112,187,200,209,237],"major":[9],"challenge":[10],"due":[11],"to":[12,29,41,84,92,98,121,182,199],"the":[13,17,19,22,25,66,71,85,94,101,126,132,140,165,175,193,196],"constraining":[14],"geometry":[15],"of":[16,21,50,65,96,103,142,195],"conduits,":[18],"proximity":[20],"walls,":[23],"and":[24,60,147,170,219,232],"perceptual":[26],"limitations":[27],"inherent":[28],"such":[30,158],"scenarios.":[31],"We":[32],"propose":[33],"reinforcement":[35],"learning":[36],"approach":[37,206],"enabling":[38],"navigate":[42],"unknown":[43,216],"three-dimensional":[44],"tubes":[45],"without":[46],"any":[47],"prior":[48],"knowledge":[49],"their":[51],"geometry,":[52],"relying":[53],"solely":[54],"on":[55,139],"local":[56],"observations":[57],"from":[58,81,131],"LiDAR":[59,148],"conditional":[62],"visual":[63,133],"detection":[64],"tube":[67,127],"center.":[68],"In":[69],"contrast,":[70],"Pure":[72],"Pursuit":[73],"algorithm,":[74],"used":[75],"as":[76],"deterministic":[78,176],"baseline,":[79],"benefits":[80],"explicit":[82],"access":[83,181],"centerline,":[86],"creating":[87],"an":[88],"information":[89],"asymmetry":[90],"designed":[91],"assess":[93],"ability":[95],"RL":[97],"compensate":[99],"for":[100,153,212,222],"absence":[102],"geometric":[105,183],"model.":[106],"The":[107,204],"agent":[108],"is":[109],"trained":[110],"through":[111,230],"progressive":[113],"Curriculum":[114],"Learning":[115],"strategy":[116],"that":[117,164],"gradually":[118],"exposes":[119],"it":[120],"increasingly":[122],"curved":[123],"geometries,":[124],"where":[125,228],"center":[128],"frequently":[129],"disappears":[130],"field.":[134],"A":[135],"turning-negotiation":[136],"mechanism,":[137],"based":[138],"combination":[141],"direct":[143],"visibility,":[144],"directional":[145],"memory,":[146],"symmetry":[149],"cues,":[150],"proves":[151],"essential":[152],"ensuring":[154],"stable":[155],"under":[157],"partial":[159],"observability":[160],"conditions.":[161],"Experiments":[162],"show":[163],"PPO":[166],"policy":[167],"acquires":[168],"robust":[169],"generalizable":[171],"behavior,":[172],"consistently":[173],"outperforming":[174],"controller":[177],"despite":[178],"its":[179],"limited":[180],"information.":[184],"Validation":[185],"high-fidelity":[188],"3D":[189],"environment":[190],"further":[191],"confirms":[192],"transferability":[194],"learned":[197],"behavior":[198],"continuous":[201],"physical":[202],"dynamics.":[203],"proposed":[205],"thus":[207],"provides":[208],"complete":[210],"framework":[211],"autonomous":[213],"opens":[220],"perspectives":[221],"industrial,":[223],"underground,":[224],"or":[225],"medical":[226],"applications":[227],"progressing":[229],"narrow":[231],"weakly":[233],"perceptive":[234],"conduits":[235],"represents":[236],"central":[238],"challenge.":[239]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-12-13T00:00:00"}
