{"id":"https://openalex.org/W4414348330","doi":"https://doi.org/10.1109/tai.2025.3560617","title":"Investigating Primacy Bias in Multiagent Reinforcement Learning: An Empirical Study","display_name":"Investigating Primacy Bias in Multiagent Reinforcement Learning: An Empirical Study","publication_year":2025,"publication_date":"2025-09-19","ids":{"openalex":"https://openalex.org/W4414348330","doi":"https://doi.org/10.1109/tai.2025.3560617"},"language":"en","primary_location":{"id":"doi:10.1109/tai.2025.3560617","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2025.3560617","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037024339","display_name":"Jingchen Li","orcid":"https://orcid.org/0000-0003-0905-0816"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingchen Li","raw_affiliation_strings":["School of Computer, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0003-0905-0816","affiliations":[{"raw_affiliation_string":"School of Computer, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102685950","display_name":"Yusen Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210156423","display_name":"National Engineering Research Center for Information Technology in Agriculture","ror":"https://ror.org/04c3j3t84","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210156423"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yusen Yang","raw_affiliation_strings":["Information Technology Research Center, Beijing Academy of Agriculture and Forestry Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0003-4700-5757","affiliations":[{"raw_affiliation_string":"Information Technology Research Center, Beijing Academy of Agriculture and Forestry Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210156423"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100613787","display_name":"Ziming He","orcid":"https://orcid.org/0009-0003-2218-8550"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziming He","raw_affiliation_strings":["School of Computer, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0009-0003-2218-8550","affiliations":[{"raw_affiliation_string":"School of Computer, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101355904","display_name":"Huarui Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210156423","display_name":"National Engineering Research Center for Information Technology in Agriculture","ror":"https://ror.org/04c3j3t84","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210156423"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huarui Wu","raw_affiliation_strings":["Information Technology Research Center, Beijing Academy of Agriculture and Forestry Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-6958-5065","affiliations":[{"raw_affiliation_string":"Information Technology Research Center, Beijing Academy of Agriculture and Forestry Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210156423"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110031123","display_name":"Chunjiang Zhao","orcid":"https://orcid.org/0009-0005-6314-7661"},"institutions":[{"id":"https://openalex.org/I4210156423","display_name":"National Engineering Research Center for Information Technology in Agriculture","ror":"https://ror.org/04c3j3t84","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210156423"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunjiang Zhao","raw_affiliation_strings":["Information Technology Research Center, Beijing Academy of Agriculture and Forestry Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0005-6314-7661","affiliations":[{"raw_affiliation_string":"Information Technology Research Center, Beijing Academy of Agriculture and Forestry Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210156423"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061189209","display_name":"Kao\u2010Shing Hwang","orcid":"https://orcid.org/0000-0001-9234-4836"},"institutions":[{"id":"https://openalex.org/I142974352","display_name":"National Sun Yat-sen University","ror":"https://ror.org/00mjawt10","country_code":"TW","type":"education","lineage":["https://openalex.org/I142974352"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Kao-Shing Hwang","raw_affiliation_strings":["the Department of Electrical Engineering, National Sun Yat-sen University, Kaohsiung, Taiwan"],"raw_orcid":"https://orcid.org/0000-0001-9234-4836","affiliations":[{"raw_affiliation_string":"the Department of Electrical Engineering, National Sun Yat-sen University, Kaohsiung, Taiwan","institution_ids":["https://openalex.org/I142974352"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.6348,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.87556357,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"7","issue":"4","first_page":"1874","last_page":"1882"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10646","display_name":"Experimental Behavioral Economics Studies","score":0.3961000144481659,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10646","display_name":"Experimental Behavioral Economics Studies","score":0.3961000144481659,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8083000183105469},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.8058000206947327},{"id":"https://openalex.org/keywords/adaptability","display_name":"Adaptability","score":0.6416000127792358},{"id":"https://openalex.org/keywords/empirical-research","display_name":"Empirical research","score":0.5314000248908997},{"id":"https://openalex.org/keywords/phenomenon","display_name":"Phenomenon","score":0.46470001339912415},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.37630000710487366}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8083000183105469},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.8058000206947327},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.6416000127792358},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.5314000248908997},{"id":"https://openalex.org/C50335755","wikidata":"https://www.wikidata.org/wiki/Q483247","display_name":"Phenomenon","level":2,"score":0.46470001339912415},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.42410001158714294},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3905999958515167},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.37630000710487366},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3675000071525574},{"id":"https://openalex.org/C196340769","wikidata":"https://www.wikidata.org/wiki/Q7698910","display_name":"Temporal difference learning","level":3,"score":0.35580000281333923},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33739998936653137},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.28290000557899475},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.2623000144958496},{"id":"https://openalex.org/C29122968","wikidata":"https://www.wikidata.org/wiki/Q1414816","display_name":"Incentive","level":2,"score":0.2603999972343445}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tai.2025.3560617","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2025.3560617","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W2141559645","https://openalex.org/W3026486560","https://openalex.org/W3081661003","https://openalex.org/W3155557419","https://openalex.org/W3206042616","https://openalex.org/W4206569030","https://openalex.org/W4319165238","https://openalex.org/W4377695283","https://openalex.org/W4392894584","https://openalex.org/W4394603098","https://openalex.org/W4397026139","https://openalex.org/W4399533021","https://openalex.org/W7133213525"],"related_works":[],"abstract_inverted_index":{"In":[0],"the":[1,5,22,25,33,59,79,85,112,125,136],"past":[2],"two":[3],"years,":[4],"phenomenon":[6],"of":[7,27,37,61,81,87,103],"<italic":[8,38,62,104],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[9,39,63,105],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">primacy":[10,40,64,106],"bias</i>":[11,41,107],"in":[12,42,108,118],"reinforcement":[13,28,44,55,120,137],"learning":[14,56,138],"has":[15],"been":[16],"extensively":[17],"investigated,":[18],"sparking":[19],"discussions":[20],"within":[21],"community":[23],"regarding":[24],"plasticity":[26],"learning.":[29,45,121],"This":[30],"study":[31],"represents":[32],"first":[34],"comprehensive":[35],"exploration":[36],"multiagent":[43],"Building":[46],"on":[47,94],"our":[48],"previous":[49],"works,":[50],"we":[51,123],"demonstrate":[52],"that":[53],"multi-agent":[54,96,109,141],"also":[57],"encounters":[58],"challenge":[60],"bias</i>.":[65],"We":[66,90],"then":[67],"provide":[68],"a":[69],"comparative":[70],"analysis":[71],"across":[72],"various":[73],"settings,":[74],"including":[75],"different":[76],"evaluation":[77],"methods,":[78],"sharing":[80],"policy":[82],"parameters,":[83],"and":[84,127],"adaptability":[86],"decentralized":[88],"policies.":[89],"conducted":[91],"extensive":[92],"experiments":[93],"multiple":[95],"benchmarks.":[97],"Our":[98],"findings":[99],"reveal":[100],"specific":[101],"characteristics":[102],"learning,":[110],"showing":[111],"difference":[113],"between":[114],"them":[115],"with":[116],"those":[117],"single-agent":[119],"While,":[122],"discuss":[124],"limitations":[126],"challenges":[128],"encountered":[129],"when":[130],"directly":[131],"applying":[132],"existing":[133],"solutions":[134],"from":[135],"domain":[139],"to":[140],"scenarios.":[142]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
