{"id":"https://openalex.org/W2135560932","doi":"https://doi.org/10.1109/adprl.2011.5967386","title":"An adaptive-learning framework for semi-cooperative multi-agent coordination","display_name":"An adaptive-learning framework for semi-cooperative multi-agent coordination","publication_year":2011,"publication_date":"2011-04-01","ids":{"openalex":"https://openalex.org/W2135560932","doi":"https://doi.org/10.1109/adprl.2011.5967386","mag":"2135560932"},"language":"en","primary_location":{"id":"doi:10.1109/adprl.2011.5967386","is_oa":false,"landing_page_url":"https://doi.org/10.1109/adprl.2011.5967386","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE Symposium on Adaptive Dynamic Programming and Reinforcement Learning (ADPRL)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071638577","display_name":"Abdeslem Boukhtouta","orcid":null},"institutions":[{"id":"https://openalex.org/I1297460800","display_name":"Defence Research and Development Canada","ror":"https://ror.org/00hgy8d33","country_code":"CA","type":"funder","lineage":["https://openalex.org/I1297460800","https://openalex.org/I1336338359","https://openalex.org/I2802286613"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Abdeslem Boukhtouta","raw_affiliation_strings":["Defence Research and Development Canada, QUE, Canada","Defence Research & Development Canada, Valcartier, Quebec, G3J 1X5 Canada"],"affiliations":[{"raw_affiliation_string":"Defence Research and Development Canada, QUE, Canada","institution_ids":["https://openalex.org/I1297460800"]},{"raw_affiliation_string":"Defence Research & Development Canada, Valcartier, Quebec, G3J 1X5 Canada","institution_ids":["https://openalex.org/I1297460800"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062247508","display_name":"Jean Berger","orcid":"https://orcid.org/0000-0001-5885-9254"},"institutions":[{"id":"https://openalex.org/I1297460800","display_name":"Defence Research and Development Canada","ror":"https://ror.org/00hgy8d33","country_code":"CA","type":"funder","lineage":["https://openalex.org/I1297460800","https://openalex.org/I1336338359","https://openalex.org/I2802286613"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Jean Berger","raw_affiliation_strings":["Defence Research and Development Canada, QUE, Canada","Defence Research & Development Canada, Valcartier, Quebec, G3J 1X5 Canada"],"affiliations":[{"raw_affiliation_string":"Defence Research and Development Canada, QUE, Canada","institution_ids":["https://openalex.org/I1297460800"]},{"raw_affiliation_string":"Defence Research & Development Canada, Valcartier, Quebec, G3J 1X5 Canada","institution_ids":["https://openalex.org/I1297460800"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054833334","display_name":"Warren B. Powell","orcid":"https://orcid.org/0000-0002-4364-7555"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Warren B. Powell","raw_affiliation_strings":["Department of Operations Research and Financial Engineering, Princeton University, Princeton, NJ, USA","Dept. of Operations Research & Financial Eng., Princeton University, NJ 08544, USA"],"affiliations":[{"raw_affiliation_string":"Department of Operations Research and Financial Engineering, Princeton University, Princeton, NJ, USA","institution_ids":["https://openalex.org/I20089843"]},{"raw_affiliation_string":"Dept. of Operations Research & Financial Eng., Princeton University, NJ 08544, USA","institution_ids":["https://openalex.org/I20089843"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002736434","display_name":"Abraham George","orcid":"https://orcid.org/0000-0003-4535-1894"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Abraham George","raw_affiliation_strings":["Department of Operations Research and Financial Engineering, Princeton University, Princeton, NJ, USA","Dept. of Operations Research & Financial Eng., Princeton University, NJ 08544, USA"],"affiliations":[{"raw_affiliation_string":"Department of Operations Research and Financial Engineering, Princeton University, Princeton, NJ, USA","institution_ids":["https://openalex.org/I20089843"]},{"raw_affiliation_string":"Dept. of Operations Research & Financial Eng., Princeton University, NJ 08544, USA","institution_ids":["https://openalex.org/I20089843"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5071638577"],"corresponding_institution_ids":["https://openalex.org/I1297460800"],"apc_list":null,"apc_paid":null,"fwci":0.4402,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.7459817,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"2","issue":null,"first_page":"324","last_page":"331"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11182","display_name":"Auction Theory and Applications","score":0.9866999983787537,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11031","display_name":"Game Theory and Applications","score":0.9865999817848206,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6882916688919067},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.6104606986045837},{"id":"https://openalex.org/keywords/ideal","display_name":"Ideal (ethics)","score":0.6033499836921692},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5591884851455688},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.5562524795532227},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.4490443766117096},{"id":"https://openalex.org/keywords/information-exchange","display_name":"Information exchange","score":0.4237365126609802},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.39629244804382324},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3356412947177887},{"id":"https://openalex.org/keywords/knowledge-management","display_name":"Knowledge management","score":0.3257367014884949},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1496695578098297},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.12872254848480225},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.08183413743972778}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6882916688919067},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.6104606986045837},{"id":"https://openalex.org/C2776639384","wikidata":"https://www.wikidata.org/wiki/Q840396","display_name":"Ideal (ethics)","level":2,"score":0.6033499836921692},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5591884851455688},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.5562524795532227},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4490443766117096},{"id":"https://openalex.org/C189693848","wikidata":"https://www.wikidata.org/wiki/Q6031064","display_name":"Information exchange","level":2,"score":0.4237365126609802},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.39629244804382324},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3356412947177887},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.3257367014884949},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1496695578098297},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.12872254848480225},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.08183413743972778},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.0},{"id":"https://openalex.org/C194257627","wikidata":"https://www.wikidata.org/wiki/Q211554","display_name":"Amplifier","level":3,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/adprl.2011.5967386","is_oa":false,"landing_page_url":"https://doi.org/10.1109/adprl.2011.5967386","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE Symposium on Adaptive Dynamic Programming and Reinforcement Learning (ADPRL)","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.300.2482","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.300.2482","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.castlelab.princeton.edu/Papers/Berger Boukhtouta George Powell-Adaptive learning framework for semi-cooperative multi-agent coordinat.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5199999809265137,"display_name":"Partnerships for the goals","id":"https://metadata.un.org/sdg/17"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":101,"referenced_works":["https://openalex.org/W18322812","https://openalex.org/W21526160","https://openalex.org/W23115616","https://openalex.org/W63255316","https://openalex.org/W116417374","https://openalex.org/W117519490","https://openalex.org/W145683767","https://openalex.org/W165177707","https://openalex.org/W184585622","https://openalex.org/W993966725","https://openalex.org/W1480376833","https://openalex.org/W1481773530","https://openalex.org/W1481982958","https://openalex.org/W1483309316","https://openalex.org/W1486821414","https://openalex.org/W1488636191","https://openalex.org/W1506018624","https://openalex.org/W1525019474","https://openalex.org/W1530715683","https://openalex.org/W1553456369","https://openalex.org/W1556565823","https://openalex.org/W1565708010","https://openalex.org/W1569529949","https://openalex.org/W1569990960","https://openalex.org/W1571787852","https://openalex.org/W1574700590","https://openalex.org/W1576452626","https://openalex.org/W1578513650","https://openalex.org/W1587263632","https://openalex.org/W1601081659","https://openalex.org/W1601649239","https://openalex.org/W1612191182","https://openalex.org/W1795214984","https://openalex.org/W1854776945","https://openalex.org/W1888914589","https://openalex.org/W1982547713","https://openalex.org/W1983688269","https://openalex.org/W1996285291","https://openalex.org/W2002482313","https://openalex.org/W2008134955","https://openalex.org/W2038426159","https://openalex.org/W2040358553","https://openalex.org/W2047463693","https://openalex.org/W2063317370","https://openalex.org/W2065118686","https://openalex.org/W2075476358","https://openalex.org/W2076355050","https://openalex.org/W2092792265","https://openalex.org/W2099190243","https://openalex.org/W2100144172","https://openalex.org/W2104602264","https://openalex.org/W2105560970","https://openalex.org/W2108314197","https://openalex.org/W2109191620","https://openalex.org/W2109878893","https://openalex.org/W2117341272","https://openalex.org/W2123726099","https://openalex.org/W2132388847","https://openalex.org/W2142839172","https://openalex.org/W2146482048","https://openalex.org/W2147107304","https://openalex.org/W2147492008","https://openalex.org/W2149052950","https://openalex.org/W2151408086","https://openalex.org/W2155058860","https://openalex.org/W2159314501","https://openalex.org/W2160108997","https://openalex.org/W2170034549","https://openalex.org/W2170051340","https://openalex.org/W2171211995","https://openalex.org/W2181699502","https://openalex.org/W2319588593","https://openalex.org/W2324139981","https://openalex.org/W2334782222","https://openalex.org/W2487144912","https://openalex.org/W2736278702","https://openalex.org/W2770401204","https://openalex.org/W2911283634","https://openalex.org/W2914656440","https://openalex.org/W2936405433","https://openalex.org/W3109580747","https://openalex.org/W4241918052","https://openalex.org/W4307347247","https://openalex.org/W6600962046","https://openalex.org/W6604655690","https://openalex.org/W6604702912","https://openalex.org/W6607689547","https://openalex.org/W6625980573","https://openalex.org/W6628981685","https://openalex.org/W6633523339","https://openalex.org/W6634528131","https://openalex.org/W6639136740","https://openalex.org/W6649398222","https://openalex.org/W6675811377","https://openalex.org/W6681246212","https://openalex.org/W6683382367","https://openalex.org/W6684885968","https://openalex.org/W6686236104","https://openalex.org/W6689723076","https://openalex.org/W7010869870","https://openalex.org/W7038962950"],"related_works":["https://openalex.org/W2590472383","https://openalex.org/W2383873009","https://openalex.org/W2393580911","https://openalex.org/W2212184297","https://openalex.org/W3156456913","https://openalex.org/W2390945180","https://openalex.org/W2394052932","https://openalex.org/W2350360626","https://openalex.org/W2570940879","https://openalex.org/W2889555279"],"abstract_inverted_index":{"Complex":[0],"problems":[1],"involving":[2],"multiple":[3],"agents":[4,68,91],"exhibit":[5],"varying":[6],"degrees":[7],"of":[8,12,52,72,87,102],"cooperation.":[9],"The":[10,67],"levels":[11],"cooperation":[13],"might":[14],"reflect":[15],"both":[16],"differences":[17,23],"in":[18,24,60],"information":[19],"as":[20,22],"well":[21],"goals.":[25],"In":[26],"this":[27],"research,":[28],"we":[29],"develop":[30],"a":[31,41,57,113],"general":[32],"mathematical":[33],"model":[34],"for":[35],"distributed,":[36],"semi-cooperative":[37],"planning":[38],"and":[39,62,92],"suggest":[40],"solution":[42,98],"strategy":[43],"which":[44,53],"involves":[45],"decomposing":[46],"the":[47,85,90,97,103,107],"system":[48],"into":[49],"subproblems,":[50],"each":[51,75],"is":[54,110],"specified":[55],"at":[56],"certain":[58],"period":[59],"time":[61],"controlled":[63,111],"by":[64,112],"an":[65],"agent.":[66,115],"communicate":[69],"marginal":[70],"values":[71],"resources":[73],"to":[74,83],"other,":[76],"possibly":[77],"with":[78,95],"distortion.":[79],"We":[80],"design":[81],"experiments":[82],"demonstrate":[84],"benefits":[86],"communication":[88],"between":[89],"show":[93],"that,":[94],"communication,":[96],"quality":[99],"approaches":[100],"that":[101],"ideal":[104],"situation":[105],"where":[106],"entire":[108],"problem":[109],"single":[114]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2013,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
