{"id":"https://openalex.org/W4402626843","doi":"https://doi.org/10.1109/access.2024.3463732","title":"Reinforcement Learning for Autonomous Agents: Scene-Specific Dynamic Obstacle Avoidance and Target Pursuit in Unknown Environments","display_name":"Reinforcement Learning for Autonomous Agents: Scene-Specific Dynamic Obstacle Avoidance and Target Pursuit in Unknown Environments","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4402626843","doi":"https://doi.org/10.1109/access.2024.3463732"},"language":"en","primary_location":{"id":"doi:10.1109/access.2024.3463732","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/access.2024.3463732","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"http://dx.doi.org/10.1109/access.2024.3463732","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091904867","display_name":"Zixiang Tang","orcid":null},"institutions":[{"id":"https://openalex.org/I20942203","display_name":"Hainan University","ror":"https://ror.org/03q648j11","country_code":"CN","type":"education","lineage":["https://openalex.org/I20942203"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zixiang Tang","raw_affiliation_strings":["School of Computer Science and Technology, Hainan University, Hainan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Hainan University, Hainan, China","institution_ids":["https://openalex.org/I20942203"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018541733","display_name":"Fa Fu","orcid":"https://orcid.org/0000-0002-4811-7692"},"institutions":[{"id":"https://openalex.org/I20942203","display_name":"Hainan University","ror":"https://ror.org/03q648j11","country_code":"CN","type":"education","lineage":["https://openalex.org/I20942203"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fa Fu","raw_affiliation_strings":["School of Computer Science and Technology, Hainan University, Hainan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Hainan University, Hainan, China","institution_ids":["https://openalex.org/I20942203"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111105698","display_name":"Gaoshang Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I20942203","display_name":"Hainan University","ror":"https://ror.org/03q648j11","country_code":"CN","type":"education","lineage":["https://openalex.org/I20942203"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gaoshang Lu","raw_affiliation_strings":["School of Computer Science and Technology, Hainan University, Hainan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Hainan University, Hainan, China","institution_ids":["https://openalex.org/I20942203"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034940430","display_name":"D. Chen","orcid":"https://orcid.org/0000-0002-3682-172X"},"institutions":[{"id":"https://openalex.org/I20942203","display_name":"Hainan University","ror":"https://ror.org/03q648j11","country_code":"CN","type":"education","lineage":["https://openalex.org/I20942203"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Da Chen","raw_affiliation_strings":["School of Computer Science and Technology, Hainan University, Hainan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Hainan University, Hainan, China","institution_ids":["https://openalex.org/I20942203"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5091904867"],"corresponding_institution_ids":["https://openalex.org/I20942203"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":1.0245,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.80740933,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"12","issue":null,"first_page":"145496","last_page":"145510"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9363999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9363999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7701227068901062},{"id":"https://openalex.org/keywords/obstacle-avoidance","display_name":"Obstacle avoidance","score":0.7548305988311768},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.7085427045822144},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7010951042175293},{"id":"https://openalex.org/keywords/smooth-pursuit","display_name":"Smooth pursuit","score":0.6685037612915039},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5172058343887329},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4442134499549866},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.3664143979549408},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.2779896855354309},{"id":"https://openalex.org/keywords/eye-movement","display_name":"Eye movement","score":0.11606565117835999},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.0807146430015564},{"id":"https://openalex.org/keywords/collision","display_name":"Collision","score":0.07977375388145447}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7701227068901062},{"id":"https://openalex.org/C6683253","wikidata":"https://www.wikidata.org/wiki/Q7075535","display_name":"Obstacle avoidance","level":4,"score":0.7548305988311768},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.7085427045822144},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7010951042175293},{"id":"https://openalex.org/C10324989","wikidata":"https://www.wikidata.org/wiki/Q3400677","display_name":"Smooth pursuit","level":3,"score":0.6685037612915039},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5172058343887329},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4442134499549866},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.3664143979549408},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.2779896855354309},{"id":"https://openalex.org/C153050134","wikidata":"https://www.wikidata.org/wiki/Q760256","display_name":"Eye movement","level":2,"score":0.11606565117835999},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0807146430015564},{"id":"https://openalex.org/C121704057","wikidata":"https://www.wikidata.org/wiki/Q352070","display_name":"Collision","level":2,"score":0.07977375388145447}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2024.3463732","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/access.2024.3463732","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:7f721f2b9b004cafb9529175e4087021","is_oa":true,"landing_page_url":"https://doaj.org/article/7f721f2b9b004cafb9529175e4087021","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 12, Pp 145496-145510 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2024.3463732","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/access.2024.3463732","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.46000000834465027,"display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G3541521188","display_name":null,"funder_award_id":"2022-007","funder_id":"https://openalex.org/F4320327832","funder_display_name":"Shantou Science and Technology Project"}],"funders":[{"id":"https://openalex.org/F4320327832","display_name":"Shantou Science and Technology Project","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2913749762","https://openalex.org/W2321940404","https://openalex.org/W2140606111","https://openalex.org/W2991662304","https://openalex.org/W2794689129","https://openalex.org/W2785353696","https://openalex.org/W2355860162","https://openalex.org/W2022120107","https://openalex.org/W2624388109","https://openalex.org/W2102947728"],"abstract_inverted_index":{"This":[0,50,162],"research":[1],"presents":[2],"a":[3,69,103,125,152],"novel":[4],"approach":[5,123,163],"to":[6,42,89,112,131],"train":[7],"autonomous":[8,160],"agents":[9],"in":[10,55,159],"complex":[11,44,75,166],"and":[12,22,36,46,60,82],"unknown":[13],"environments,":[14],"focusing":[15],"on":[16],"scene-specific":[17,70],"learning,":[18],"dynamic":[19],"obstacle":[20],"avoidance,":[21],"target":[23],"tracking.":[24],"Traditional":[25],"reinforcement":[26,133,167],"learning":[27,71,147,158,168],"(RL)":[28],"methods":[29],"often":[30],"suffer":[31],"from":[32],"high":[33],"time":[34,140],"complexity":[35],"inefficiency,":[37],"which":[38,106],"hinder":[39],"agents\u2019":[40],"ability":[41],"learn":[43],"behaviors":[45,87],"understand":[47],"their":[48],"interconnections.":[49],"limitation":[51],"creates":[52],"significant":[53],"challenges":[54],"environments":[56],"requiring":[57],"rapid":[58],"adaptation":[59],"multifaceted":[61],"responses.":[62],"To":[63],"address":[64],"these":[65],"issues,":[66],"we":[67],"propose":[68],"framework":[72,145],"that":[73,121],"decomposes":[74],"scenes":[76],"into":[77,98,102],"sub-scenes,":[78],"enabling":[79],"targeted":[80],"training":[81,139],"the":[83,109,114],"acquisition":[84],"of":[85],"distinct":[86],"linked":[88],"various":[90],"models.":[91],"In":[92],"intricate":[93],"scenarios,":[94],"observations":[95],"are":[96],"transformed":[97],"specific":[99],"signals":[100],"fed":[101],"state":[104],"machine,":[105],"then":[107],"invokes":[108],"appropriate":[110],"model":[111],"generate":[113],"required":[115],"actions.":[116],"Firstly,":[117],"our":[118],"experiments":[119],"demonstrate":[120],"this":[122,143],"achieves":[124],"70%":[126],"faster":[127],"convergence":[128],"rate":[129],"compared":[130],"direct":[132],"learning.":[134],"Secondly,":[135],"it":[136],"significantly":[137],"reduces":[138],"complexity.":[141],"Thirdly,":[142],"structured":[144],"enhances":[146],"efficiency":[148],"and,":[149],"lastly,":[150],"provides":[151],"scalable":[153],"solution":[154],"for":[155],"sophisticated":[156],"multi-task":[157],"systems.":[161],"effectively":[164],"addresses":[165],"challenges.":[169]},"counts_by_year":[{"year":2026,"cited_by_count":3}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
