{"id":"https://openalex.org/W4399769714","doi":"https://doi.org/10.1109/icara60736.2024.10553074","title":"Sim-to-Real Deep Reinforcement Learning Based Obstacle Avoidance for UAVs Under Measurement Uncertainty","display_name":"Sim-to-Real Deep Reinforcement Learning Based Obstacle Avoidance for UAVs Under Measurement Uncertainty","publication_year":2024,"publication_date":"2024-02-22","ids":{"openalex":"https://openalex.org/W4399769714","doi":"https://doi.org/10.1109/icara60736.2024.10553074"},"language":"en","primary_location":{"id":"doi:10.1109/icara60736.2024.10553074","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icara60736.2024.10553074","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 10th International Conference on Automation, Robotics and Applications (ICARA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088763781","display_name":"Bhaskar Joshi","orcid":"https://orcid.org/0009-0004-1743-7265"},"institutions":[{"id":"https://openalex.org/I65181880","display_name":"Indian Institute of Technology Hyderabad","ror":"https://ror.org/01j4v3x97","country_code":"IN","type":"education","lineage":["https://openalex.org/I65181880"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Bhaskar Joshi","raw_affiliation_strings":["RRC, IIIT,Hyderabad","RRC, IIIT, Hyderabad"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RRC, IIIT,Hyderabad","institution_ids":["https://openalex.org/I65181880"]},{"raw_affiliation_string":"RRC, IIIT, Hyderabad","institution_ids":["https://openalex.org/I65181880"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043127138","display_name":"Dhruv Kapur","orcid":null},"institutions":[{"id":"https://openalex.org/I65181880","display_name":"Indian Institute of Technology Hyderabad","ror":"https://ror.org/01j4v3x97","country_code":"IN","type":"education","lineage":["https://openalex.org/I65181880"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Dhruv Kapur","raw_affiliation_strings":["RRC, IIIT,Hyderabad","RRC, IIIT, Hyderabad"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RRC, IIIT,Hyderabad","institution_ids":["https://openalex.org/I65181880"]},{"raw_affiliation_string":"RRC, IIIT, Hyderabad","institution_ids":["https://openalex.org/I65181880"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026782960","display_name":"Harikumar Kandath","orcid":"https://orcid.org/0000-0002-5500-7133"},"institutions":[{"id":"https://openalex.org/I65181880","display_name":"Indian Institute of Technology Hyderabad","ror":"https://ror.org/01j4v3x97","country_code":"IN","type":"education","lineage":["https://openalex.org/I65181880"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Harikumar Kandath","raw_affiliation_strings":["RRC, IIIT,Hyderabad","RRC, IIIT, Hyderabad"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RRC, IIIT,Hyderabad","institution_ids":["https://openalex.org/I65181880"]},{"raw_affiliation_string":"RRC, IIIT, Hyderabad","institution_ids":["https://openalex.org/I65181880"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.406,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.89920101,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"278","last_page":"284"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/obstacle-avoidance","display_name":"Obstacle avoidance","score":0.8191018104553223},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7933810949325562},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6031002998352051},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.557070791721344},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.5143293142318726},{"id":"https://openalex.org/keywords/obstacle","display_name":"Obstacle","score":0.49956297874450684},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.1997046172618866},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.17023137211799622},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.1636269986629486}],"concepts":[{"id":"https://openalex.org/C6683253","wikidata":"https://www.wikidata.org/wiki/Q7075535","display_name":"Obstacle avoidance","level":4,"score":0.8191018104553223},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7933810949325562},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6031002998352051},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.557070791721344},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.5143293142318726},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.49956297874450684},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.1997046172618866},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.17023137211799622},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.1636269986629486},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C121704057","wikidata":"https://www.wikidata.org/wiki/Q352070","display_name":"Collision","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icara60736.2024.10553074","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icara60736.2024.10553074","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 10th International Conference on Automation, Robotics and Applications (ICARA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/13","score":0.6499999761581421,"display_name":"Climate action"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W1484503832","https://openalex.org/W1977655452","https://openalex.org/W2105934661","https://openalex.org/W2181005557","https://openalex.org/W2553522096","https://openalex.org/W2736601468","https://openalex.org/W2916826721","https://openalex.org/W2975816184","https://openalex.org/W2996195849","https://openalex.org/W3000498189","https://openalex.org/W3036868238","https://openalex.org/W3153187775","https://openalex.org/W3207833010","https://openalex.org/W3216772467","https://openalex.org/W4220806879","https://openalex.org/W6804601995"],"related_works":["https://openalex.org/W2930076404","https://openalex.org/W4253519380","https://openalex.org/W2071957557","https://openalex.org/W2596413128","https://openalex.org/W4391249562","https://openalex.org/W2356867392","https://openalex.org/W2913749762","https://openalex.org/W2321940404","https://openalex.org/W2782776446","https://openalex.org/W3043170174"],"abstract_inverted_index":{"Deep":[0,28],"Reinforcement":[1,29],"Learning":[2,30],"is":[3,56,97],"quickly":[4],"becoming":[5],"a":[6,60,75,196,208],"popular":[7],"method":[8],"for":[9,38,49,104],"training":[10,161],"autonomous":[11],"Unmanned":[12],"Aerial":[13],"Vehicles":[14],"(UAVs).":[15],"Our":[16],"work":[17],"analyzes":[18],"the":[19,25,46,72,80,109,118,127,137,150,165,176,182,190,205],"effects":[20,119],"of":[21,27,74,102,111,114,120,139,164,185],"measurement":[22],"uncertainty":[23,41],"on":[24],"performance":[26,73,135,156],"(DRL)":[31],"based":[32],"waypoint":[33],"navigation":[34,171],"and":[35,51,68,92,131,162,203],"obstacle":[36],"avoidance":[37],"UAVs.":[39],"Measurement":[40,54],"originates":[42],"from":[43],"noise":[44,148],"in":[45,86,108,136,157,175,193,207],"sensors":[47],"used":[48],"localization":[50],"detecting":[52],"obstacles.":[53],"uncertainty/noise":[55],"considered":[57],"to":[58,116],"follow":[59],"Gaussian":[61],"probability":[62],"distribution":[63],"with":[64,89,99],"unknown":[65],"non-zero":[66],"mean":[67],"variance.":[69],"We":[70],"evaluate":[71,181],"DRL":[76,166],"agent,":[77],"trained":[78,192],"using":[79],"Proximal":[81],"Policy":[82],"Optimization":[83],"(PPO)":[84],"algorithm":[85],"an":[87],"environment":[88,96],"continuous":[90],"state":[91],"action":[93],"spaces.":[94],"The":[95],"randomized":[98],"different":[100],"numbers":[101],"obstacles":[103],"each":[105],"simulation":[106,194],"episode":[107],"presence":[110,138],"varying":[112],"degrees":[113],"noise,":[115],"capture":[117],"realistic":[121],"sensor":[122],"measurements.":[123],"Denoising":[124],"techniques":[125],"like":[126],"low":[128],"pass":[129],"filter":[130,133],"Kalman":[132],"improve":[134],"unbiased":[140],"noise.":[141],"Moreover,":[142],"we":[143,188],"show":[144],"that":[145],"artificially":[146],"injecting":[147],"into":[149],"measurements":[151],"during":[152],"evaluation":[153],"actually":[154],"improves":[155],"certain":[158],"scenarios.":[159],"Extensive":[160],"testing":[163],"agent":[167],"under":[168],"various":[169],"UAV":[170,198],"scenarios":[172],"are":[173],"performed":[174],"PyBullet":[177],"physics":[178],"simulator.":[179],"To":[180],"practical":[183],"validity":[184],"our":[186],"method,":[187],"port":[189],"policy":[191],"onto":[195],"real":[197],"without":[199],"any":[200],"further":[201],"modifications":[202],"verify":[204],"results":[206],"real-world":[209],"environment.":[210]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
