{"id":"https://openalex.org/W3114597659","doi":"https://doi.org/10.1109/ictc49870.2020.9289571","title":"Limit Action Space to Enhance Drone Control with Deep Reinforcement Learning","display_name":"Limit Action Space to Enhance Drone Control with Deep Reinforcement Learning","publication_year":2020,"publication_date":"2020-10-21","ids":{"openalex":"https://openalex.org/W3114597659","doi":"https://doi.org/10.1109/ictc49870.2020.9289571","mag":"3114597659"},"language":"en","primary_location":{"id":"doi:10.1109/ictc49870.2020.9289571","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ictc49870.2020.9289571","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Conference on Information and Communication Technology Convergence (ICTC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070677616","display_name":"Sooyoung Jang","orcid":"https://orcid.org/0000-0002-6931-9592"},"institutions":[{"id":"https://openalex.org/I142401562","display_name":"Electronics and Telecommunications Research Institute","ror":"https://ror.org/03ysstz10","country_code":"KR","type":"facility","lineage":["https://openalex.org/I142401562","https://openalex.org/I2801339556","https://openalex.org/I4210144908","https://openalex.org/I4387152098"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Sooyoung Jang","raw_affiliation_strings":["Intelligence Convergence Research Laboratory, Electronics and Telecommunications Research Institute (ETRI), Daejeon, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Intelligence Convergence Research Laboratory, Electronics and Telecommunications Research Institute (ETRI), Daejeon, Republic of Korea","institution_ids":["https://openalex.org/I142401562"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5027995571","display_name":"Noh-Sam Park","orcid":null},"institutions":[{"id":"https://openalex.org/I142401562","display_name":"Electronics and Telecommunications Research Institute","ror":"https://ror.org/03ysstz10","country_code":"KR","type":"facility","lineage":["https://openalex.org/I142401562","https://openalex.org/I2801339556","https://openalex.org/I4210144908","https://openalex.org/I4387152098"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Noh-Sam Park","raw_affiliation_strings":["Intelligence Convergence Research Laboratory, Electronics and Telecommunications Research Institute (ETRI), Daejeon, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Intelligence Convergence Research Laboratory, Electronics and Telecommunications Research Institute (ETRI), Daejeon, Republic of Korea","institution_ids":["https://openalex.org/I142401562"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5070677616"],"corresponding_institution_ids":["https://openalex.org/I142401562"],"apc_list":null,"apc_paid":null,"fwci":0.1326,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.57112363,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1212","last_page":"1215"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.991100013256073,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9872000217437744,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8936042189598083},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.7786054015159607},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.7365512251853943},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6935358047485352},{"id":"https://openalex.org/keywords/limit","display_name":"Limit (mathematics)","score":0.6573633551597595},{"id":"https://openalex.org/keywords/drone","display_name":"Drone","score":0.6517235636711121},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.6205005645751953},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.538821816444397},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.47783923149108887},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.43419772386550903},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.17391663789749146},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.15826234221458435}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8936042189598083},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.7786054015159607},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.7365512251853943},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6935358047485352},{"id":"https://openalex.org/C151201525","wikidata":"https://www.wikidata.org/wiki/Q177239","display_name":"Limit (mathematics)","level":2,"score":0.6573633551597595},{"id":"https://openalex.org/C59519942","wikidata":"https://www.wikidata.org/wiki/Q650665","display_name":"Drone","level":2,"score":0.6517235636711121},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.6205005645751953},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.538821816444397},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.47783923149108887},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.43419772386550903},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.17391663789749146},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.15826234221458435},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ictc49870.2020.9289571","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ictc49870.2020.9289571","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Conference on Information and Communication Technology Convergence (ICTC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W2145339207","https://openalex.org/W2736601468","https://openalex.org/W2811374584","https://openalex.org/W2901563868","https://openalex.org/W2962890638","https://openalex.org/W2963094322","https://openalex.org/W6741002519","https://openalex.org/W6752963931"],"related_works":["https://openalex.org/W4229448053","https://openalex.org/W4247925126","https://openalex.org/W4327774218","https://openalex.org/W2059768187","https://openalex.org/W4312858960","https://openalex.org/W4386036939","https://openalex.org/W4379143281","https://openalex.org/W2605096541","https://openalex.org/W3200286695","https://openalex.org/W4212885606"],"abstract_inverted_index":{"Although":[0],"many":[1],"research":[2],"progresses":[3],"on":[4,91],"deep":[5,65],"reinforcement":[6,66],"learning,":[7],"it":[8],"is":[9],"not":[10],"yet":[11],"perfect.":[12],"It":[13],"may":[14],"take":[15],"too":[16],"much":[17],"time":[18],"or":[19],"even":[20],"fail":[21],"to":[22,76,81,117],"solve":[23],"the":[24,28,33,40,53,77,83,87,110,114,119],"problem.":[25],"Therefore,":[26],"simplifying":[27],"problem":[29],"by":[30,108],"intentionally":[31],"limiting":[32,86,109],"agent's":[34,88],"action":[35,57,73,89],"space":[36,58,90],"should":[37],"help":[38],"train":[39],"agent":[41,115],"efficiently":[42],"and":[43,98,102,126,132],"effectively.":[44],"To":[45],"verify":[46],"that,":[47],"in":[48],"this":[49],"paper,":[50],"we":[51],"analyze":[52,82],"performances":[54],"of":[55,79,85,112],"various":[56],"designs":[59],"for":[60],"controlling":[61],"a":[62,128],"drone":[63],"with":[64,122],"learning.":[67],"We":[68,105],"have":[69],"designed":[70],"six":[71],"different":[72],"spaces":[74],"according":[75],"degree":[78,111],"freedom":[80],"effect":[84],"performance":[92],"metrics":[93],"such":[94],"as":[95],"travel":[96,124],"distance":[97,125],"time,":[99],"goal":[100,120,130],"rate,":[101],"total":[103],"reward.":[104,133],"show":[106],"that":[107],"freedom,":[113],"learns":[116],"reach":[118],"faster":[121],"less":[123],"achieve":[127],"higher":[129],"rate":[131]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
