{"id":"https://openalex.org/W2975703112","doi":"https://doi.org/10.1007/978-3-030-31978-6_8","title":"Deep Multi-agent Reinforcement Learning in a Homogeneous Open Population","display_name":"Deep Multi-agent Reinforcement Learning in a Homogeneous Open Population","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2975703112","doi":"https://doi.org/10.1007/978-3-030-31978-6_8","mag":"2975703112"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-030-31978-6_8","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-030-31978-6_8","pdf_url":null,"source":{"id":"https://openalex.org/S2764900261","display_name":"Communications in computer and information science","issn_l":"1865-0929","issn":["1865-0929","1865-0937"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Computer and Information Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008556334","display_name":"Roxana R\u0103dulescu","orcid":"https://orcid.org/0000-0003-1446-5514"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"Roxana R\u0103dulescu","raw_affiliation_strings":["Vrije Universiteit Brussel, Brussels, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Vrije Universiteit Brussel, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022330197","display_name":"Manon Legrand","orcid":null},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Manon Legrand","raw_affiliation_strings":["Vrije Universiteit Brussel, Brussels, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Vrije Universiteit Brussel, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056510473","display_name":"Kyriakos Efthymiadis","orcid":"https://orcid.org/0000-0002-2235-5115"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Kyriakos Efthymiadis","raw_affiliation_strings":["Vrije Universiteit Brussel, Brussels, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Vrije Universiteit Brussel, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081436755","display_name":"Diederik M. Roijers","orcid":"https://orcid.org/0000-0002-2825-2491"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]},{"id":"https://openalex.org/I865915315","display_name":"Vrije Universiteit Amsterdam","ror":"https://ror.org/008xxew50","country_code":"NL","type":"education","lineage":["https://openalex.org/I865915315"]}],"countries":["BE","NL"],"is_corresponding":false,"raw_author_name":"Diederik M. Roijers","raw_affiliation_strings":["Vrije Universiteit Amsterdam, Amsterdam, The Netherlands","Vrije Universiteit Brussel, Brussels, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Vrije Universiteit Amsterdam, Amsterdam, The Netherlands","institution_ids":["https://openalex.org/I865915315"]},{"raw_affiliation_string":"Vrije Universiteit Brussel, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064553018","display_name":"Ann Now\u00e9","orcid":"https://orcid.org/0000-0001-6346-4564"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Ann Now\u00e9","raw_affiliation_strings":["Vrije Universiteit Brussel, Brussels, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Vrije Universiteit Brussel, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5008556334"],"corresponding_institution_ids":["https://openalex.org/I13469542"],"apc_list":null,"apc_paid":null,"fwci":3.3057,"has_fulltext":true,"cited_by_count":20,"citation_normalized_percentile":{"value":0.94182135,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"90","last_page":"105"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9769999980926514,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.9452000260353088,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8673243522644043},{"id":"https://openalex.org/keywords/homogeneous","display_name":"Homogeneous","score":0.7685304880142212},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7394973635673523},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.6467702984809875},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6346759796142578},{"id":"https://openalex.org/keywords/scratch","display_name":"Scratch","score":0.537278950214386},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4743674695491791},{"id":"https://openalex.org/keywords/marl","display_name":"Marl","score":0.4257318377494812},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35022103786468506},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.33781129121780396},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.33563342690467834},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10644423961639404},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09928643703460693},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.056894510984420776}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8673243522644043},{"id":"https://openalex.org/C66882249","wikidata":"https://www.wikidata.org/wiki/Q169336","display_name":"Homogeneous","level":2,"score":0.7685304880142212},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7394973635673523},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.6467702984809875},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6346759796142578},{"id":"https://openalex.org/C2781235140","wikidata":"https://www.wikidata.org/wiki/Q275131","display_name":"Scratch","level":2,"score":0.537278950214386},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4743674695491791},{"id":"https://openalex.org/C92927620","wikidata":"https://www.wikidata.org/wiki/Q184053","display_name":"Marl","level":3,"score":0.4257318377494812},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35022103786468506},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.33781129121780396},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.33563342690467834},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10644423961639404},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09928643703460693},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.056894510984420776},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C109007969","wikidata":"https://www.wikidata.org/wiki/Q749565","display_name":"Structural basin","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1007/978-3-030-31978-6_8","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-030-31978-6_8","pdf_url":null,"source":{"id":"https://openalex.org/S2764900261","display_name":"Communications in computer and information science","issn_l":"1865-0929","issn":["1865-0929","1865-0937"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Computer and Information Science","raw_type":"book-chapter"},{"id":"pmh:oai:vubissmart:VUBISSMART:2000:119511","is_oa":false,"landing_page_url":"https://biblio.vub.ac.be/vubir/deep-multiagent-reinforcement-learning-in-a-homogeneous-open-population(6bad77bf-af31-4015-bdaf-a539a6bc3900).html","pdf_url":null,"source":{"id":"https://openalex.org/S4306402573","display_name":"VUBIR (Vrije Universiteit Brussel)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I13469542","host_organization_name":"Vrije Universiteit Brussel","host_organization_lineage":["https://openalex.org/I13469542"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":null,"raw_type":"publishedVersion"},{"id":"pmh:oai:research.vu.nl:openaire_cris_publications/d6b37f71-52f9-4448-8785-1f53847863f6","is_oa":false,"landing_page_url":"https://hdl.handle.net/1871.1/d6b37f71-52f9-4448-8785-1f53847863f6","pdf_url":null,"source":{"id":"https://openalex.org/S4306401107","display_name":"VU Research Portal","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I865915315","host_organization_name":"Vrije Universiteit Amsterdam","host_organization_lineage":["https://openalex.org/I865915315"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"R\u0103dulescu, R, Legrand, M, Efthymiadis, K, Roijers, D M & Now\u00e9, A 2019, Deep Multi-agent Reinforcement Learning in a Homogeneous Open Population. in M Atzmueller & W Duivesteijn (eds), ARTIFICIAL INTELLIGENCE : 30th Benelux Conference, BNAIC 2018, Den Bosch November 8-9 2018, Revised Selected Papers. Communications in Computer and Information Science, vol. 1021, Springer, pp. 90-105, 30th Benelux Conference on Artificial Intelligence, BNAIC 2018, \u2018s-Hertogenbosch, Netherlands, 8/11/18. https://doi.org/10.1007/978-3-030-31978-6_8","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:vubissmart:VUBISSMART:2000:125078","is_oa":false,"landing_page_url":"https://biblio.vub.ac.be/vubir/deep-multiagent-reinforcement-learning-in-a-homogeneous-open-population(6d52b9b6-ca3a-4ee2-b844-2b0af78ed933).html","pdf_url":null,"source":{"id":"https://openalex.org/S4306402573","display_name":"VUBIR (Vrije Universiteit Brussel)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I13469542","host_organization_name":"Vrije Universiteit Brussel","host_organization_lineage":["https://openalex.org/I13469542"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"article"},{"id":"pmh:vu:oai:research.vu.nl:publications/d6b37f71-52f9-4448-8785-1f53847863f6","is_oa":false,"landing_page_url":"https://research.vu.nl/en/publications/d6b37f71-52f9-4448-8785-1f53847863f6","pdf_url":null,"source":{"id":"https://openalex.org/S4306401843","display_name":"Data Archiving and Networked Services (DANS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1322597698","host_organization_name":"Royal Netherlands Academy of Arts and Sciences","host_organization_lineage":["https://openalex.org/I1322597698"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ARTIFICIAL INTELLIGENCE: 30th Benelux Conference, BNAIC 2018, Den Bosch November 8-9 2018, Revised Selected Papers, 90 - 105","raw_type":"info:eu-repo/semantics/conferencepaper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320313460","display_name":"Agentschap Innoveren en Ondernemen","ror":"https://ror.org/032xdry56"},{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320327336","display_name":"Vlaamse regering","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W6043852","https://openalex.org/W103885025","https://openalex.org/W329015778","https://openalex.org/W1457482454","https://openalex.org/W1757796397","https://openalex.org/W1973039793","https://openalex.org/W2095705004","https://openalex.org/W2097381042","https://openalex.org/W2099618002","https://openalex.org/W2121863487","https://openalex.org/W2141559645","https://openalex.org/W2145339207","https://openalex.org/W2146502635","https://openalex.org/W2155968351","https://openalex.org/W2173248099","https://openalex.org/W2243485899","https://openalex.org/W2257979135","https://openalex.org/W2260756217","https://openalex.org/W2395575420","https://openalex.org/W2530195778","https://openalex.org/W2602275733","https://openalex.org/W2768629321","https://openalex.org/W2786036274","https://openalex.org/W2949608212","https://openalex.org/W2963053311","https://openalex.org/W2963407617","https://openalex.org/W2963802642","https://openalex.org/W2964043796","https://openalex.org/W3011120880","https://openalex.org/W3126753172","https://openalex.org/W3127772140","https://openalex.org/W4214717370","https://openalex.org/W6637967152"],"related_works":["https://openalex.org/W2126019709","https://openalex.org/W1702901972","https://openalex.org/W4249798507","https://openalex.org/W2069775250","https://openalex.org/W2475116013","https://openalex.org/W2152754392","https://openalex.org/W2066741154","https://openalex.org/W2196316523","https://openalex.org/W1989172970","https://openalex.org/W1899363654"],"abstract_inverted_index":null,"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":4},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":3}],"updated_date":"2026-05-14T08:36:36.166977","created_date":"2025-10-10T00:00:00"}
