{"id":"https://openalex.org/W4417131018","doi":"https://doi.org/10.1109/lra.2025.3641120","title":"Vision-Guided Outdoor Flight and Obstacle Evasion via Reinforcement Learning","display_name":"Vision-Guided Outdoor Flight and Obstacle Evasion via Reinforcement Learning","publication_year":2025,"publication_date":"2025-12-08","ids":{"openalex":"https://openalex.org/W4417131018","doi":"https://doi.org/10.1109/lra.2025.3641120"},"language":null,"primary_location":{"id":"doi:10.1109/lra.2025.3641120","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2025.3641120","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048810975","display_name":"Shiladitya Dutta","orcid":null},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]},{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Shiladitya Dutta","raw_affiliation_strings":["Department of Electrical Engineering and Computer Science, College of Engineering, University of California Berkeley, Berkeley, CA, USA","College of Engineering, Department of Electrical Engineering and Computer Science, University of California Berkeley, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, College of Engineering, University of California Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]},{"raw_affiliation_string":"College of Engineering, Department of Electrical Engineering and Computer Science, University of California Berkeley, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023189559","display_name":"Aayush Gupta","orcid":"https://orcid.org/0000-0001-6780-6744"},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aayush Gupta","raw_affiliation_strings":["Department of Electrical Engineering and Computer Science, College of Engineering, University of California Berkeley, Berkeley, CA, USA","College of Engineering, Department of Electrical Engineering and Computer Science, University of California Berkeley, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, College of Engineering, University of California Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]},{"raw_affiliation_string":"College of Engineering, Department of Electrical Engineering and Computer Science, University of California Berkeley, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017660889","display_name":"Vaibhav Saran","orcid":null},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Varun Saran","raw_affiliation_strings":["Department of Electrical Engineering and Computer Science, College of Engineering, University of California Berkeley, Berkeley, CA, USA","College of Engineering, Department of Electrical Engineering and Computer Science, University of California Berkeley, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, College of Engineering, University of California Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]},{"raw_affiliation_string":"College of Engineering, Department of Electrical Engineering and Computer Science, University of California Berkeley, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008034417","display_name":"Avideh Zakhor","orcid":"https://orcid.org/0000-0003-4770-6353"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]},{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Avideh Zakhor","raw_affiliation_strings":["Department of Electrical Engineering and Computer Science, College of Engineering, University of California Berkeley, Berkeley, CA, USA","College of Engineering, Department of Electrical Engineering and Computer Science, University of California Berkeley, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, College of Engineering, University of California Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]},{"raw_affiliation_string":"College of Engineering, Department of Electrical Engineering and Computer Science, University of California Berkeley, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5048810975"],"corresponding_institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.51819467,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"11","issue":"2","first_page":"1202","last_page":"1209"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.501800000667572,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.501800000667572,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.06759999692440033,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12125","display_name":"Aerospace and Aviation Technology","score":0.06639999896287918,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7663000226020813},{"id":"https://openalex.org/keywords/obstacle-avoidance","display_name":"Obstacle avoidance","score":0.5},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.49549999833106995},{"id":"https://openalex.org/keywords/planner","display_name":"Planner","score":0.49219998717308044},{"id":"https://openalex.org/keywords/drone","display_name":"Drone","score":0.47450000047683716},{"id":"https://openalex.org/keywords/tree-traversal","display_name":"Tree traversal","score":0.43720000982284546},{"id":"https://openalex.org/keywords/obstacle","display_name":"Obstacle","score":0.42309999465942383},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.4180000126361847},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.39149999618530273},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.39100000262260437}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7663000226020813},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6779000163078308},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5310999751091003},{"id":"https://openalex.org/C6683253","wikidata":"https://www.wikidata.org/wiki/Q7075535","display_name":"Obstacle avoidance","level":4,"score":0.5},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.49549999833106995},{"id":"https://openalex.org/C2776999362","wikidata":"https://www.wikidata.org/wiki/Q2349274","display_name":"Planner","level":2,"score":0.49219998717308044},{"id":"https://openalex.org/C59519942","wikidata":"https://www.wikidata.org/wiki/Q650665","display_name":"Drone","level":2,"score":0.47450000047683716},{"id":"https://openalex.org/C140745168","wikidata":"https://www.wikidata.org/wiki/Q1210082","display_name":"Tree traversal","level":2,"score":0.43720000982284546},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.42309999465942383},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.4180000126361847},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.39149999618530273},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.39100000262260437},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.38269999623298645},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.35429999232292175},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3447999954223633},{"id":"https://openalex.org/C175291020","wikidata":"https://www.wikidata.org/wiki/Q1156822","display_name":"Offset (computer science)","level":2,"score":0.3278000056743622},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.32760000228881836},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.32269999384880066},{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.3197999894618988},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.303600013256073},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.2939000129699707},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.2904999852180481},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2890999913215637},{"id":"https://openalex.org/C92991967","wikidata":"https://www.wikidata.org/wiki/Q7644329","display_name":"Supervisory control","level":3,"score":0.2833999991416931},{"id":"https://openalex.org/C49441653","wikidata":"https://www.wikidata.org/wiki/Q2014717","display_name":"Odometry","level":4,"score":0.2809999883174896},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.2732999920845032},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.27149999141693115},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2639999985694885},{"id":"https://openalex.org/C145565327","wikidata":"https://www.wikidata.org/wiki/Q852514","display_name":"Motion control","level":3,"score":0.26350000500679016},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.26190000772476196},{"id":"https://openalex.org/C68387754","wikidata":"https://www.wikidata.org/wiki/Q7271585","display_name":"Schedule","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C554190296","wikidata":"https://www.wikidata.org/wiki/Q47528","display_name":"Radar","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C190839683","wikidata":"https://www.wikidata.org/wiki/Q2448197","display_name":"Train","level":2,"score":0.25679999589920044},{"id":"https://openalex.org/C79487989","wikidata":"https://www.wikidata.org/wiki/Q934680","display_name":"Vehicle dynamics","level":2,"score":0.25540000200271606},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.2531999945640564},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.25270000100135803},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.25099998712539673},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.25040000677108765},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2025.3641120","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2025.3641120","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W2482392012","https://openalex.org/W2582119245","https://openalex.org/W2788239209","https://openalex.org/W2951360122","https://openalex.org/W2963249250","https://openalex.org/W2967452881","https://openalex.org/W2991625383","https://openalex.org/W3009542919","https://openalex.org/W3131526549","https://openalex.org/W3202883604","https://openalex.org/W4220923746","https://openalex.org/W4383066575","https://openalex.org/W4383108878","https://openalex.org/W4389665475","https://openalex.org/W4389665598","https://openalex.org/W4396910019","https://openalex.org/W4401414021","https://openalex.org/W4401416465","https://openalex.org/W4405778711","https://openalex.org/W4405778892","https://openalex.org/W4408254239","https://openalex.org/W4411055067"],"related_works":[],"abstract_inverted_index":{"Although":[0],"quadcopters":[1],"boast":[2],"impressive":[3],"traversal":[4],"capabilities":[5],"enabled":[6],"by":[7,72,87,116],"their":[8,21],"omnidirectional":[9],"maneuverability,":[10],"the":[11,68,101,135],"need":[12],"for":[13],"continuous":[14],"pilot":[15],"control":[16,76],"in":[17,23,50,103,129],"complex":[18],"environments":[19,170],"impedes":[20],"application":[22],"GNSS":[24],"and":[25,41,75,95,142,155,171],"telemetry-denied":[26],"scenarios.":[27],"To":[28,133],"this":[29],"end,":[30],"we":[31,138],"propose":[32],"a":[33,56,64,73,106,117,123,130,147,172],"novel":[34],"sensorimotor":[35],"policy":[36,60,102,148],"that":[37,83,149,175],"uses":[38],"stereo-vision":[39],"depth":[40],"visual-inertial":[42],"odometry":[43],"(VIO)":[44],"to":[45,54,99,145,153,167],"autonomously":[46],"navigate":[47],"through":[48,105],"obstacles":[49],"an":[51,88],"unknown":[52],"environment":[53],"reach":[55],"goal":[57],"point.":[58],"The":[59],"is":[61,150],"comprised":[62],"of":[63],"pre-trained":[65],"autoencoder":[66],"as":[67,122],"perception":[69],"head":[70],"followed":[71,86],"planning":[74],"LSTM":[77],"network":[78],"which":[79],"outputs":[80],"velocity":[81],"commands":[82],"can":[84],"be":[85],"off-the-shelf":[89],"commercial":[90],"drone.":[91],"We":[92],"leverage":[93],"reinforcement":[94],"privileged":[96],"learning":[97],"paradigms":[98],"train":[100],"simulation":[104],"two-stage":[107],"process:":[108],"1)":[109],"initial":[110],"training":[111],"with":[112],"optimal":[113],"trajectories":[114],"generated":[115],"global":[118],"motion":[119],"planner":[120],"acting":[121],"supervisory":[124],"backbone,":[125],"2)":[126],"further":[127],"fine-tuning":[128],"curriculum":[131],"environment.":[132],"bridge":[134],"sim-to-real":[136],"gap,":[137],"employ":[139],"domain":[140,156],"randomization":[141],"reward":[143],"shaping":[144],"create":[146],"both":[151,168],"robust":[152],"noise":[154],"shift.":[157],"In":[158],"outdoor":[159],"experiments,":[160],"our":[161],"approach":[162],"achieves":[163],"successful":[164],"zero-shot":[165],"transfer":[166],"obstacle":[169],"drone":[173],"platform":[174],"were":[176],"never":[177],"encountered":[178],"during":[179],"training.":[180]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-12-08T00:00:00"}
