{"id":"https://openalex.org/W3121294994","doi":"https://doi.org/10.1109/globecom42002.2020.9322446","title":"Value Decomposition based Multi-Task Multi-Agent Deep Reinforcement Learning in Vehicular Networks","display_name":"Value Decomposition based Multi-Task Multi-Agent Deep Reinforcement Learning in Vehicular Networks","publication_year":2020,"publication_date":"2020-12-01","ids":{"openalex":"https://openalex.org/W3121294994","doi":"https://doi.org/10.1109/globecom42002.2020.9322446","mag":"3121294994"},"language":"en","primary_location":{"id":"doi:10.1109/globecom42002.2020.9322446","is_oa":false,"landing_page_url":"https://doi.org/10.1109/globecom42002.2020.9322446","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"GLOBECOM 2020 - 2020 IEEE Global Communications Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101846831","display_name":"Shilin Xu","orcid":"https://orcid.org/0000-0002-5249-0035"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shilin Xu","raw_affiliation_strings":["Beijing Laboratory of Advanced Information Networks, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Laboratory of Advanced Information Networks, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058648594","display_name":"Caili Guo","orcid":"https://orcid.org/0000-0001-8892-4520"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Caili Guo","raw_affiliation_strings":["Beijing Laboratory of Advanced Information Networks, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Laboratory of Advanced Information Networks, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057118326","display_name":"Rose Qingyang Hu","orcid":"https://orcid.org/0000-0002-1571-3631"},"institutions":[{"id":"https://openalex.org/I121980950","display_name":"Utah State University","ror":"https://ror.org/00h6set76","country_code":"US","type":"education","lineage":["https://openalex.org/I121980950"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rose Qingyang Hu","raw_affiliation_strings":["Utah State University, UT, USA"],"affiliations":[{"raw_affiliation_string":"Utah State University, UT, USA","institution_ids":["https://openalex.org/I121980950"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073527013","display_name":"Yi Qian","orcid":"https://orcid.org/0000-0001-5671-916X"},"institutions":[{"id":"https://openalex.org/I114395901","display_name":"University of Nebraska\u2013Lincoln","ror":"https://ror.org/043mer456","country_code":"US","type":"education","lineage":["https://openalex.org/I114395901"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yi Qian","raw_affiliation_strings":["University of Nebraska-Lincoln, Omaha, USA"],"affiliations":[{"raw_affiliation_string":"University of Nebraska-Lincoln, Omaha, USA","institution_ids":["https://openalex.org/I114395901"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101846831"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":null,"apc_paid":null,"fwci":0.3082,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.58657451,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10761","display_name":"Vehicular Ad Hoc Networks (VANETs)","score":0.9882000088691711,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10761","display_name":"Vehicular Ad Hoc Networks (VANETs)","score":0.9882000088691711,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10270","display_name":"Blockchain Technology Applications and Security","score":0.9729999899864197,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.9729999899864197,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9212723970413208},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6995543241500854},{"id":"https://openalex.org/keywords/decomposition","display_name":"Decomposition","score":0.6594878435134888},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6349087953567505},{"id":"https://openalex.org/keywords/value","display_name":"Value (mathematics)","score":0.5280053615570068},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49255046248435974},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2514570355415344},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11244064569473267}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9212723970413208},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6995543241500854},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.6594878435134888},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6349087953567505},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.5280053615570068},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49255046248435974},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2514570355415344},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11244064569473267},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/globecom42002.2020.9322446","is_oa":false,"landing_page_url":"https://doi.org/10.1109/globecom42002.2020.9322446","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"GLOBECOM 2020 - 2020 IEEE Global Communications Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4000000059604645,"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9"}],"awards":[{"id":"https://openalex.org/G4710853384","display_name":null,"funder_award_id":"2018YFB1800805","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G5181277069","display_name":null,"funder_award_id":"4202049","funder_id":"https://openalex.org/F4320322919","funder_display_name":"Natural Science Foundation of Beijing Municipality"}],"funders":[{"id":"https://openalex.org/F4320322919","display_name":"Natural Science Foundation of Beijing Municipality","ror":null},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1757796397","https://openalex.org/W2097381042","https://openalex.org/W2604427121","https://openalex.org/W2604873668","https://openalex.org/W2624731731","https://openalex.org/W2626637010","https://openalex.org/W2765172389","https://openalex.org/W2889540440","https://openalex.org/W2908261578","https://openalex.org/W2909706750","https://openalex.org/W2950892788","https://openalex.org/W2951896791","https://openalex.org/W2963334314","https://openalex.org/W3012492598","https://openalex.org/W3049635259","https://openalex.org/W4298857966","https://openalex.org/W6637967152","https://openalex.org/W6674600207","https://openalex.org/W6736372492","https://openalex.org/W6736572398","https://openalex.org/W6739516088","https://openalex.org/W6781899394"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W2024136090","https://openalex.org/W2586732548","https://openalex.org/W3049728571","https://openalex.org/W2964765435","https://openalex.org/W2366903352"],"abstract_inverted_index":{"With":[0],"the":[1,53,61,69,79,82,86,105,113,119,155,171,174],"development":[2],"of":[3,10,29,73,104,173],"intelligent":[4],"transportation":[5],"system":[6],"(ITS),":[7],"a":[8,27,32,36,48,146],"multitude":[9],"novel":[11],"vehicular":[12,33,109,167],"applications":[13],"have":[14],"been":[15],"emerging.":[16],"There":[17],"is":[18,46],"an":[19,162],"urgent":[20],"need":[21],"for":[22],"simultaneously":[23],"supporting":[24],"multi-tasks":[25],"across":[26],"group":[28],"vehicles":[30],"in":[31,78,85,140],"network,":[34],"forming":[35],"typical":[37],"multi-task":[38],"multi-agent":[39],"(MTMA)":[40],"environment.":[41],"Deep":[42],"Reinforcement":[43],"Learning":[44],"(DRL)":[45],"deemed":[47],"promising":[49],"approach":[50],"to":[51,60,95,117,169],"solving":[52],"highly":[54],"complicated":[55,120],"MTMA":[56,80,163],"problem.":[57],"However,":[58],"owing":[59],"extraordinarily":[62],"growing":[63],"computational":[64],"complexity":[65],"as":[66,68],"well":[67],"explosively":[70],"increasing":[71],"dimension":[72],"state":[74,148],"and":[75,91,127,142,149],"action":[76,150],"spaces":[77],"environment,":[81],"value":[83,121],"functions":[84],"DRL":[87],"are":[88],"usually":[89],"bulky":[90],"could":[92],"be":[93,96],"difficult":[94],"learned":[97],"efficiently.":[98],"In":[99,157],"this":[100,158],"way,":[101],"by":[102],"virtue":[103],"correlations":[106],"among":[107],"multiple":[108],"tasks,":[110],"we":[111,160],"adopt":[112],"value-decomposition":[114],"mechanism":[115,176],"(VDM)":[116],"decompose":[118],"function":[122],"into":[123],"several":[124],"small":[125],"pieces":[126],"then":[128],"compute":[129],"each":[130],"sub-function":[131],"separately.":[132],"The":[133],"proposed":[134,175],"paradigm":[135],"can":[136],"yield":[137],"great":[138],"speed-up":[139],"learning":[141],"help":[143],"substantially":[144],"with":[145,165,177],"smaller":[147],"space":[151],"but":[152],"without":[153],"degrading":[154],"performance.":[156],"work,":[159],"consider":[161],"environment":[164],"three":[166],"tasks":[168],"demonstrate":[170],"effectiveness":[172],"simulation":[178],"results.":[179]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
