{"id":"https://openalex.org/W4416250847","doi":"https://doi.org/10.1109/ijcnn64981.2025.11228238","title":"Mutual Information and Trajectory-Awared Reinforcement Learning for Multi-Agent Path Finding","display_name":"Mutual Information and Trajectory-Awared Reinforcement Learning for Multi-Agent Path Finding","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4416250847","doi":"https://doi.org/10.1109/ijcnn64981.2025.11228238"},"language":null,"primary_location":{"id":"doi:10.1109/ijcnn64981.2025.11228238","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn64981.2025.11228238","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102881974","display_name":"Chuang Zhao","orcid":"https://orcid.org/0000-0002-7308-4757"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chuang Zhao","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Computer Science and Technology,Beijing,China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Computer Science and Technology,Beijing,China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112116986","display_name":"Ying Liu","orcid":"https://orcid.org/0000-0003-3987-0954"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ying Liu","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Computer Science and Technology,Beijing,China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Computer Science and Technology,Beijing,China","institution_ids":["https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5102881974"],"corresponding_institution_ids":["https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.37368939,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9732999801635742,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9732999801635742,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.0044999998062849045,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.00430000014603138,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8313999772071838},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.5169000029563904},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.4645000100135803},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4523000121116638},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.40610000491142273},{"id":"https://openalex.org/keywords/drone","display_name":"Drone","score":0.40059998631477356},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.3709999918937683},{"id":"https://openalex.org/keywords/mobile-robot-navigation","display_name":"Mobile robot navigation","score":0.3684000074863434}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8313999772071838},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6611999869346619},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.5169000029563904},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5101000070571899},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.4645000100135803},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4523000121116638},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.40610000491142273},{"id":"https://openalex.org/C59519942","wikidata":"https://www.wikidata.org/wiki/Q650665","display_name":"Drone","level":2,"score":0.40059998631477356},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.3709999918937683},{"id":"https://openalex.org/C26990112","wikidata":"https://www.wikidata.org/wiki/Q6887224","display_name":"Mobile robot navigation","level":5,"score":0.3684000074863434},{"id":"https://openalex.org/C25321074","wikidata":"https://www.wikidata.org/wiki/Q1969601","display_name":"Pathfinding","level":4,"score":0.36230000853538513},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3206000030040741},{"id":"https://openalex.org/C152139883","wikidata":"https://www.wikidata.org/wiki/Q252973","display_name":"Mutual information","level":2,"score":0.31029999256134033},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.30489999055862427},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.29760000109672546},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.27799999713897705},{"id":"https://openalex.org/C192126672","wikidata":"https://www.wikidata.org/wiki/Q1068715","display_name":"Telecommunications network","level":2,"score":0.2678000032901764},{"id":"https://openalex.org/C2777891301","wikidata":"https://www.wikidata.org/wiki/Q3475123","display_name":"Navigation system","level":2,"score":0.2632000148296356},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.2612000107765198},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.2551000118255615}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn64981.2025.11228238","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn64981.2025.11228238","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W192919555","https://openalex.org/W1989407213","https://openalex.org/W1990186220","https://openalex.org/W2030775133","https://openalex.org/W2123030512","https://openalex.org/W2155992093","https://openalex.org/W2575733488","https://openalex.org/W2809708768","https://openalex.org/W2892258706","https://openalex.org/W2914296650","https://openalex.org/W2963809389","https://openalex.org/W2963821308","https://openalex.org/W2964211993","https://openalex.org/W2964945728","https://openalex.org/W2964997335","https://openalex.org/W3023923733","https://openalex.org/W3088197938","https://openalex.org/W3092786062","https://openalex.org/W3129616587","https://openalex.org/W3206082228","https://openalex.org/W3212192385","https://openalex.org/W4221155367","https://openalex.org/W4283789768","https://openalex.org/W4389689571"],"related_works":[],"abstract_inverted_index":{"The":[0,156],"multi-agent":[1,31,107],"pathfinding":[2],"problem":[3],"(MAPF)":[4],"has":[5,34],"been":[6],"widely":[7],"used":[8],"in":[9,44,81],"large-scale":[10],"robotic":[11],"systems,":[12],"such":[13],"as":[14],"robot":[15],"collaboration,":[16],"drone":[17],"formation":[18],"flight,":[19],"and":[20,39,89,98,112,137,149],"logistics":[21],"systems.":[22],"Compared":[23],"with":[24,61],"traditional":[25],"planning":[26],"methods,":[27],"the":[28,35,52,67,73,121,144,151,162],"method":[29],"using":[30],"reinforcement":[32,164],"learning":[33,165],"characteristics":[36],"of":[37,69,75,147],"real-time":[38],"distributed.":[40],"A":[41],"fundamental":[42],"challenge":[43],"obtaining":[45],"a":[46,82,102,117],"collision-free":[47],"navigation":[48,108,122,148,166],"strategy":[49,123],"is":[50,124,159],"that":[51,132],"agents":[53,76],"need":[54],"to":[55,57,59,77,87],"learn":[56],"cooperate":[58],"deal":[60],"congestion.":[62],"However,":[63],"existing":[64,163],"methods":[65],"have":[66,130],"defects":[68],"low":[70,90],"communication":[71,111,135],"efficiency,":[72],"inability":[74],"obtain":[78],"environmental":[79],"information":[80],"timely":[83],"manner,":[84],"which":[85],"leads":[86],"collisions":[88],"success":[91,145],"rates.":[92],"This":[93],"paper":[94],"introduces":[95],"Mutual":[96],"Information":[97],"Trajectory-Awared":[99],"Network":[100],"(MI-TAN),":[101],"novel":[103],"framework":[104],"for":[105,126],"enhancing":[106],"through":[109],"dynamic":[110],"intrinsic":[113],"exploration":[114],"rewards.":[115],"Using":[116],"distributed":[118],"training":[119],"method,":[120],"learned":[125],"each":[127],"agent.":[128],"Experiments":[129],"shown":[131],"while":[133],"improving":[134],"efficiency":[136],"encouraging":[138],"efficient":[139],"exploration,":[140],"it":[141],"also":[142],"improves":[143],"rate":[146,153],"reduces":[150],"collision":[152],"between":[154],"agents.":[155],"average":[157],"performance":[158],"better":[160],"than":[161],"method.":[167]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-14T00:00:00"}
