{"id":"https://openalex.org/W3186325801","doi":"https://doi.org/10.1109/tsmc.2021.3096935","title":"An Improved Dyna-<i>Q</i> Algorithm for Mobile Robot Path Planning in Unknown Dynamic Environment","display_name":"An Improved Dyna-<i>Q</i> Algorithm for Mobile Robot Path Planning in Unknown Dynamic Environment","publication_year":2021,"publication_date":"2021-07-26","ids":{"openalex":"https://openalex.org/W3186325801","doi":"https://doi.org/10.1109/tsmc.2021.3096935","mag":"3186325801"},"language":"en","primary_location":{"id":"doi:10.1109/tsmc.2021.3096935","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2021.3096935","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052963938","display_name":"Muleilan Pei","orcid":"https://orcid.org/0000-0002-7721-6251"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Muleilan Pei","raw_affiliation_strings":["Space Control and Inertial Technology Research Center, Harbin Institute of Technology, Harbin, China"],"raw_orcid":"https://orcid.org/0000-0002-7721-6251","affiliations":[{"raw_affiliation_string":"Space Control and Inertial Technology Research Center, Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066550564","display_name":"Hao An","orcid":"https://orcid.org/0000-0003-0919-2283"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao An","raw_affiliation_strings":["Space Control and Inertial Technology Research Center, Harbin Institute of Technology, Harbin, China"],"raw_orcid":"https://orcid.org/0000-0003-0919-2283","affiliations":[{"raw_affiliation_string":"Space Control and Inertial Technology Research Center, Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100461752","display_name":"Bo Liu","orcid":"https://orcid.org/0000-0003-4006-1126"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Liu","raw_affiliation_strings":["Space Control and Inertial Technology Research Center, Harbin Institute of Technology, Harbin, China"],"raw_orcid":"https://orcid.org/0000-0003-4006-1126","affiliations":[{"raw_affiliation_string":"Space Control and Inertial Technology Research Center, Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100427143","display_name":"Changhong Wang","orcid":"https://orcid.org/0000-0002-9534-6711"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changhong Wang","raw_affiliation_strings":["Space Control and Inertial Technology Research Center, Harbin Institute of Technology, Harbin, China"],"raw_orcid":"https://orcid.org/0000-0002-9534-6711","affiliations":[{"raw_affiliation_string":"Space Control and Inertial Technology Research Center, Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I204983213"],"apc_list":null,"apc_paid":null,"fwci":5.6279,"has_fulltext":false,"cited_by_count":96,"citation_normalized_percentile":{"value":0.97045924,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"52","issue":"7","first_page":"4415","last_page":"4425"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12288","display_name":"Optimization and Search Problems","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/notation","display_name":"Notation","score":0.5888059735298157},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.5578159093856812},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4593629240989685},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4520416855812073},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4417344033718109},{"id":"https://openalex.org/keywords/simulated-annealing","display_name":"Simulated annealing","score":0.41511139273643494},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.396472692489624},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.39201515913009644},{"id":"https://openalex.org/keywords/arithmetic","display_name":"Arithmetic","score":0.10639289021492004}],"concepts":[{"id":"https://openalex.org/C45357846","wikidata":"https://www.wikidata.org/wiki/Q2001982","display_name":"Notation","level":2,"score":0.5888059735298157},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.5578159093856812},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4593629240989685},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4520416855812073},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4417344033718109},{"id":"https://openalex.org/C126980161","wikidata":"https://www.wikidata.org/wiki/Q863783","display_name":"Simulated annealing","level":2,"score":0.41511139273643494},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.396472692489624},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.39201515913009644},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.10639289021492004},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tsmc.2021.3096935","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2021.3096935","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4588764917","display_name":null,"funder_award_id":"SKLRS201801A05","funder_id":"https://openalex.org/F4320327001","funder_display_name":"State Key Laboratory of Robotics and System"},{"id":"https://openalex.org/G6055139975","display_name":null,"funder_award_id":"61903101","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G778607359","display_name":null,"funder_award_id":"BX201700064","funder_id":"https://openalex.org/F4320335768","funder_display_name":"National Postdoctoral Program for Innovative Talents"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320327001","display_name":"State Key Laboratory of Robotics and System","ror":null},{"id":"https://openalex.org/F4320335768","display_name":"National Postdoctoral Program for Innovative Talents","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W41554520","https://openalex.org/W1589747210","https://openalex.org/W1681019253","https://openalex.org/W1901616594","https://openalex.org/W1980035368","https://openalex.org/W1997880753","https://openalex.org/W2005228957","https://openalex.org/W2059530451","https://openalex.org/W2084474153","https://openalex.org/W2101938656","https://openalex.org/W2106155860","https://openalex.org/W2107726111","https://openalex.org/W2413992829","https://openalex.org/W2466175722","https://openalex.org/W2592496730","https://openalex.org/W2623293810","https://openalex.org/W2766447205","https://openalex.org/W2773987374","https://openalex.org/W2800142021","https://openalex.org/W2810602713","https://openalex.org/W2911087563","https://openalex.org/W2911549659","https://openalex.org/W2917089854","https://openalex.org/W2963302368","https://openalex.org/W2968601742","https://openalex.org/W2999778183","https://openalex.org/W3099518626","https://openalex.org/W3100751385","https://openalex.org/W3111294788","https://openalex.org/W3111570917","https://openalex.org/W4230167402","https://openalex.org/W4246917522","https://openalex.org/W6634211352","https://openalex.org/W6750106230","https://openalex.org/W6756486208"],"related_works":["https://openalex.org/W2051487156","https://openalex.org/W2504004674","https://openalex.org/W1987679298","https://openalex.org/W2073681303","https://openalex.org/W2963177394","https://openalex.org/W4313359513","https://openalex.org/W2498744856","https://openalex.org/W4390482104","https://openalex.org/W322408318","https://openalex.org/W149041114"],"abstract_inverted_index":{"This":[0],"article":[1],"deals":[2],"with":[3,78,87,153],"the":[4,61,79,88,97,102,121,178,193],"problem":[5],"of":[6,104],"mobile":[7,179],"robot":[8,168,175,180],"path":[9,113],"planning":[10],"in":[11,139,157,192],"an":[12,29,140,150],"unknown":[13,141],"environment":[14,152],"that":[15],"contains":[16],"both":[17],"static":[18,142],"and":[19,47,92,100,109,130,144,167,177],"dynamic":[20,155],"obstacles,":[21],"utilizing":[22],"a":[23,173,184],"reinforcement":[24],"learning":[25,110],"approach.":[26],"We":[27],"propose":[28],"improved":[30],"Dyna-":[31,131],"<inline-formula":[32,52,69,123,132],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[33,53,70,124,133],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">":[34,54,71,125,134],"<tex-math":[35,55,72,126,135],"notation=\"LaTeX\">${Q}$":[36,56,127,136],"</tex-math></inline-formula>":[37,57,75,128,137],"algorithm,":[38],"which":[39],"incorporates":[40],"heuristic":[41,89,93],"search":[42],"strategies,":[43],"simulated":[44],"annealing":[45],"mechanism,":[46],"reactive":[48],"navigation":[49,190],"principle":[50],"into":[51],"-learning":[58,129],"based":[59],"on":[60,172],"Dyna":[62],"architecture.":[63],"A":[64],"novel":[65],"action-selection":[66],"strategy":[67],"combining":[68],"notation=\"LaTeX\">$\\varepsilon":[73],"$":[74],"-greedy":[76],"policy":[77],"cooling":[80],"schedule":[81],"control":[82],"is":[83,118,146],"presented,":[84],"which,":[85],"together":[86],"reward":[90],"function":[91],"actions,":[94],"can":[95],"tackle":[96],"exploration-exploitation":[98],"dilemma":[99],"enhance":[101],"performance":[103],"global":[105],"searching,":[106],"convergence":[107],"property,":[108],"efficiency":[111],"for":[112],"planning.":[114],"The":[115],"proposed":[116],"method":[117],"superior":[119],"to":[120,149,182],"classical":[122],"algorithms":[138],"environment,":[143],"it":[145],"successfully":[147],"applied":[148],"uncertain":[151],"multiple":[154],"obstacles":[156],"simulations.":[158],"Further,":[159],"practical":[160],"experiments":[161],"are":[162],"conducted":[163],"by":[164],"integrating":[165],"MATLAB":[166],"operating":[169],"system":[170],"(ROS)":[171],"physical":[174],"platform,":[176],"manages":[181],"find":[183],"collision-free":[185],"path,":[186],"thus":[187],"fulfilling":[188],"autonomous":[189],"tasks":[191],"real":[194],"world.":[195]},"counts_by_year":[{"year":2026,"cited_by_count":11},{"year":2025,"cited_by_count":27},{"year":2024,"cited_by_count":36},{"year":2023,"cited_by_count":14},{"year":2022,"cited_by_count":8}],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
