{"id":"https://openalex.org/W4381744268","doi":"https://doi.org/10.1109/cscwd57460.2023.10152759","title":"Multi-Agent Collaborative Behavior Decision-Making based on Deep Reinforcement Learning","display_name":"Multi-Agent Collaborative Behavior Decision-Making based on Deep Reinforcement Learning","publication_year":2023,"publication_date":"2023-05-24","ids":{"openalex":"https://openalex.org/W4381744268","doi":"https://doi.org/10.1109/cscwd57460.2023.10152759"},"language":"en","primary_location":{"id":"doi:10.1109/cscwd57460.2023.10152759","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/cscwd57460.2023.10152759","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 26th International Conference on Computer Supported Cooperative Work in Design (CSCWD)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112944037","display_name":"Xingze Guo","orcid":null},"institutions":[{"id":"https://openalex.org/I7350606","display_name":"Dalian Jiaotong University","ror":"https://ror.org/05gp45n31","country_code":"CN","type":"education","lineage":["https://openalex.org/I7350606"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xingze Guo","raw_affiliation_strings":["Dalian Jiaotong University,School of Mechanical Engineering,Dalian,China","School of Mechanical Engineering, Dalian Jiaotong University, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian Jiaotong University,School of Mechanical Engineering,Dalian,China","institution_ids":["https://openalex.org/I7350606"]},{"raw_affiliation_string":"School of Mechanical Engineering, Dalian Jiaotong University, Dalian, China","institution_ids":["https://openalex.org/I7350606"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100416244","display_name":"Feng Gao","orcid":"https://orcid.org/0000-0002-8366-3605"},"institutions":[{"id":"https://openalex.org/I7350606","display_name":"Dalian Jiaotong University","ror":"https://ror.org/05gp45n31","country_code":"CN","type":"education","lineage":["https://openalex.org/I7350606"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Gao","raw_affiliation_strings":["Dalian Jiaotong University,School of Mechanical Engineering,Dalian,China","School of Mechanical Engineering, Dalian Jiaotong University, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian Jiaotong University,School of Mechanical Engineering,Dalian,China","institution_ids":["https://openalex.org/I7350606"]},{"raw_affiliation_string":"School of Mechanical Engineering, Dalian Jiaotong University, Dalian, China","institution_ids":["https://openalex.org/I7350606"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013055924","display_name":"Xiaojun Zheng","orcid":"https://orcid.org/0000-0003-4445-6256"},"institutions":[{"id":"https://openalex.org/I7350606","display_name":"Dalian Jiaotong University","ror":"https://ror.org/05gp45n31","country_code":"CN","type":"education","lineage":["https://openalex.org/I7350606"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaojun Zheng","raw_affiliation_strings":["Dalian Jiaotong University,School of Mechanical Engineering,Dalian,China","School of Mechanical Engineering, Dalian Jiaotong University, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian Jiaotong University,School of Mechanical Engineering,Dalian,China","institution_ids":["https://openalex.org/I7350606"]},{"raw_affiliation_string":"School of Mechanical Engineering, Dalian Jiaotong University, Dalian, China","institution_ids":["https://openalex.org/I7350606"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003646046","display_name":"Shiduo Ning","orcid":null},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiduo Ning","raw_affiliation_strings":["Dalian University of Technology,School of Mechanical Engineering,Dalian,China","School of Mechanical Engineering, Dalian University of Technology, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology,School of Mechanical Engineering,Dalian,China","institution_ids":["https://openalex.org/I27357992"]},{"raw_affiliation_string":"School of Mechanical Engineering, Dalian University of Technology, Dalian, China","institution_ids":["https://openalex.org/I27357992"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5112944037"],"corresponding_institution_ids":["https://openalex.org/I7350606"],"apc_list":null,"apc_paid":null,"fwci":0.8147,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.70160218,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"577","last_page":"581"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11500","display_name":"Evacuation and Crowd Dynamics","score":0.8474000096321106,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11500","display_name":"Evacuation and Crowd Dynamics","score":0.8474000096321106,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10734","display_name":"Information and Cyber Security","score":0.7684000134468079,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13832","display_name":"Advanced Decision-Making Techniques","score":0.7368999719619751,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8626645803451538},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7521429061889648},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.7016775608062744},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6070656776428223},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5228232145309448},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.45401516556739807},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4375538229942322},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.4107872247695923},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.303937166929245},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.2718944549560547}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8626645803451538},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7521429061889648},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.7016775608062744},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6070656776428223},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5228232145309448},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.45401516556739807},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4375538229942322},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.4107872247695923},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.303937166929245},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2718944549560547},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cscwd57460.2023.10152759","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/cscwd57460.2023.10152759","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 26th International Conference on Computer Supported Cooperative Work in Design (CSCWD)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.7799999713897705}],"awards":[],"funders":[{"id":"https://openalex.org/F4320323086","display_name":"Natural Science Foundation of Liaoning Province","ror":null},{"id":"https://openalex.org/F4320337504","display_name":"Research and Development","ror":"https://ror.org/027s68j25"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2386410636","https://openalex.org/W1985560493","https://openalex.org/W1626977535","https://openalex.org/W4284974072","https://openalex.org/W3096874164","https://openalex.org/W2357975469","https://openalex.org/W2937181779","https://openalex.org/W2182304831","https://openalex.org/W2145363145","https://openalex.org/W3168977894"],"abstract_inverted_index":{"For":[0],"the":[1,31,38,47,54,64,72,77,95,104,107,118,127],"problem":[2],"of":[3,33,49,97],"collaborative":[4,13,36,42,66,98,129],"decision-making,":[5],"we":[6,70],"propose":[7],"a":[8,18,23,84,136],"multi-agent":[9,65,128],"deep":[10,119],"reinforcement":[11,120],"learning":[12,121],"behavior":[14,67],"decision-making":[15],"algorithm.":[16],"Firstly,":[17],"discrete":[19],"state":[20],"space":[21,27],"and":[22,51,87,110],"greedy":[24],"strategy-based":[25],"action":[26],"are":[28,44],"established":[29,61],"in":[30,102,135],"context":[32],"multi-":[34],"agent":[35],"attack,":[37],"conditions":[39],"for":[40,46],"successful":[41],"siege":[43],"given":[45],"requirements":[48],"rapidity":[50],"collocation.":[52],"Secondly,":[53],"Markov":[55],"Decision":[56],"Process":[57],"(MDP)":[58],"framework":[59],"is":[60,91,123],"based":[62],"on":[63],"decision":[68,100],"algorithm,":[69],"introduce":[71],"experience":[73],"replay":[74],"to":[75,93,125],"train":[76],"neural":[78],"network":[79],"using":[80],"gradient":[81],"descent.":[82],"Finally,":[83],"centralized":[85],"training":[86,96],"distributed":[88],"execution":[89],"architecture":[90],"used":[92],"complete":[94],"behavioral":[99],"making,":[101],"which":[103],"agents":[105],"share":[106],"same":[108],"strategy":[109],"execute":[111],"actions":[112],"independently.":[113],"The":[114],"simulation":[115],"shows":[116],"that":[117],"algorithm":[122],"able":[124],"realize":[126],"decision.":[130],"It":[131],"can":[132],"be":[133],"placed":[134],"real":[137],"environment.":[138]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1}],"updated_date":"2025-12-19T19:40:27.379048","created_date":"2025-10-10T00:00:00"}
