{"id":"https://openalex.org/W4400770834","doi":"https://doi.org/10.1109/access.2024.3430392","title":"Deep Multi-Agent Reinforcement Learning for Decentralized Active Hypothesis Testing","display_name":"Deep Multi-Agent Reinforcement Learning for Decentralized Active Hypothesis Testing","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4400770834","doi":"https://doi.org/10.1109/access.2024.3430392"},"language":"en","primary_location":{"id":"doi:10.1109/access.2024.3430392","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3430392","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2024.3430392","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016627257","display_name":"Hadar Szostak","orcid":null},"institutions":[{"id":"https://openalex.org/I124227911","display_name":"Ben-Gurion University of the Negev","ror":"https://ror.org/05tkyf982","country_code":"IL","type":"education","lineage":["https://openalex.org/I124227911"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Hadar Szostak","raw_affiliation_strings":["School of Electrical and Computer Engineering, Ben-Gurion University of the Negev, Be&#x2019;er Sheva, Israel"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Ben-Gurion University of the Negev, Be&#x2019;er Sheva, Israel","institution_ids":["https://openalex.org/I124227911"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066085947","display_name":"Kobi Cohen","orcid":"https://orcid.org/0000-0003-0532-009X"},"institutions":[{"id":"https://openalex.org/I124227911","display_name":"Ben-Gurion University of the Negev","ror":"https://ror.org/05tkyf982","country_code":"IL","type":"education","lineage":["https://openalex.org/I124227911"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Kobi Cohen","raw_affiliation_strings":["School of Electrical and Computer Engineering, Ben-Gurion University of the Negev, Be&#x2019;er Sheva, Israel"],"raw_orcid":"https://orcid.org/0000-0003-0532-009X","affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Ben-Gurion University of the Negev, Be&#x2019;er Sheva, Israel","institution_ids":["https://openalex.org/I124227911"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":1.7478,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.84481039,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"12","issue":null,"first_page":"130444","last_page":"130459"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9807999730110168,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9807999730110168,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.95169997215271,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9415000081062317,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7151252627372742},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.69707852602005},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.5400370955467224},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44027066230773926},{"id":"https://openalex.org/keywords/active-learning","display_name":"Active learning (machine learning)","score":0.4154045581817627},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32118695974349976},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.08104884624481201},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.07522299885749817}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7151252627372742},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.69707852602005},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5400370955467224},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44027066230773926},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.4154045581817627},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32118695974349976},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.08104884624481201},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.07522299885749817}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2024.3430392","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3430392","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:76aab702ac594c4aa50e29d07d1b7374","is_oa":true,"landing_page_url":"https://doaj.org/article/76aab702ac594c4aa50e29d07d1b7374","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 12, Pp 130444-130459 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2024.3430392","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3430392","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.5600000023841858,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G5755329095","display_name":null,"funder_award_id":"2640/20","funder_id":"https://openalex.org/F4320322252","funder_display_name":"Israel Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320322252","display_name":"Israel Science Foundation","ror":"https://ror.org/04sazxf24"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":61,"referenced_works":["https://openalex.org/W1977218919","https://openalex.org/W1978470213","https://openalex.org/W1990038735","https://openalex.org/W1990503235","https://openalex.org/W2019645207","https://openalex.org/W2045030310","https://openalex.org/W2070495730","https://openalex.org/W2077397896","https://openalex.org/W2082167858","https://openalex.org/W2101643234","https://openalex.org/W2145339207","https://openalex.org/W2153966789","https://openalex.org/W2166205892","https://openalex.org/W2291567910","https://openalex.org/W2498422553","https://openalex.org/W2512254099","https://openalex.org/W2552178850","https://openalex.org/W2736601468","https://openalex.org/W2743681928","https://openalex.org/W2746553466","https://openalex.org/W2811374584","https://openalex.org/W2896121142","https://openalex.org/W2903142609","https://openalex.org/W2912108923","https://openalex.org/W2945910721","https://openalex.org/W2963912378","https://openalex.org/W2974976221","https://openalex.org/W2986276296","https://openalex.org/W2991046523","https://openalex.org/W2999204576","https://openalex.org/W3009317244","https://openalex.org/W3012943290","https://openalex.org/W3046653923","https://openalex.org/W3046947688","https://openalex.org/W3047988770","https://openalex.org/W3099581246","https://openalex.org/W3099689767","https://openalex.org/W3103559770","https://openalex.org/W3110383331","https://openalex.org/W3148526481","https://openalex.org/W3167838998","https://openalex.org/W3187243030","https://openalex.org/W3195411792","https://openalex.org/W4232896127","https://openalex.org/W4283821341","https://openalex.org/W4285175639","https://openalex.org/W4293370731","https://openalex.org/W4308390426","https://openalex.org/W4323020881","https://openalex.org/W4367840085","https://openalex.org/W4386473229","https://openalex.org/W6634413486","https://openalex.org/W6638018090","https://openalex.org/W6712181171","https://openalex.org/W6732665253","https://openalex.org/W6741002519","https://openalex.org/W6752963931","https://openalex.org/W6780559895","https://openalex.org/W6838811763","https://openalex.org/W6852035933","https://openalex.org/W7025045700"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W3046775127","https://openalex.org/W3107602296","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W4364306694","https://openalex.org/W4312192474","https://openalex.org/W4283697347"],"abstract_inverted_index":{"We":[0,221],"consider":[1],"a":[2,39,55,73,82,109,128,132,166,208,223],"decentralized":[3],"formulation":[4,163],"of":[5,24,96,127,173,216,226,249,261,268],"the":[6,19,22,26,35,63,87,94,99,105,125,160,171,214,218,232,247,262,266],"active":[7],"hypothesis":[8,110],"testing":[9],"(AHT)":[10],"problem,":[11],"where":[12,65],"multiple":[13],"agents":[14,33,59,69,106],"gather":[15],"noisy":[16],"observations":[17,47],"from":[18,49],"environment":[20],"with":[21,54,213],"purpose":[23],"identifying":[25],"correct":[27],"hypothesis.":[28,57],"At":[29],"each":[30,52,189,194],"time":[31,190],"step,":[32],"have":[34,136,147],"option":[36],"to":[37,61,80,138,142,199,235],"select":[38],"sampling":[40,97],"action.":[41],"These":[42],"different":[43],"actions":[44],"result":[45],"in":[46,124,151,170,272],"drawn":[48],"various":[50],"distributions,":[51],"associated":[53],"specific":[56],"The":[58,77],"collaborate":[60],"accomplish":[62],"task,":[64],"message":[66],"exchanges":[67],"between":[68],"are":[70],"allowed":[71],"over":[72,251],"rate-limited":[74],"communications":[75],"channel.":[76],"objective":[78],"is":[79,119],"devise":[81],"multi-agent":[83,161,175],"policy":[84],"that":[85,229],"minimizes":[86],"Bayes":[88,219],"risk.":[89,220],"This":[90,178],"risk":[91],"comprises":[92],"both":[93],"cost":[95,102],"and":[98,239,270],"joint":[100],"terminal":[101],"incurred":[103],"by":[104,164,192],"upon":[107],"making":[108],"declaration.":[111],"Deriving":[112],"optimal":[113],"structured":[114],"policies":[115],"for":[116,184,265],"AHT":[117,162,185],"problems":[118],"generally":[120],"mathematically":[121],"intractable,":[122],"even":[123],"context":[126],"single":[129],"agent.":[130],"As":[131],"result,":[133],"recent":[134],"efforts":[135],"turned":[137],"deep":[139,174,210],"learning":[140,153,253],"methodologies":[141],"address":[143],"these":[144],"problems,":[145],"which":[146],"exhibited":[148],"significant":[149],"success":[150],"single-agent":[152,252],"scenarios.":[154],"In":[155],"this":[156],"paper,":[157],"we":[158,245,256],"tackle":[159],"introducing":[165],"novel":[167],"algorithm":[168],"rooted":[169],"framework":[172],"reinforcement":[176],"learning.":[177],"algorithm,":[179],"named":[180],"Multi-Agent":[181],"Reinforcement":[182],"Learning":[183],"(MARLA),":[186],"operates":[187],"at":[188],"step":[191],"having":[193],"agent":[195],"map":[196],"its":[197],"state":[198],"an":[200,258],"action":[201],"(sampling":[202],"rule":[203],"or":[204],"stopping":[205],"rule)":[206],"using":[207,242],"trained":[209],"neural":[211],"network":[212],"goal":[215],"minimizing":[217],"present":[222],"comprehensive":[224],"set":[225],"experimental":[227],"results":[228],"effectively":[230],"showcase":[231],"agents\u2019":[233],"ability":[234],"learn":[236],"collaborative":[237],"strategies":[238],"enhance":[240],"performance":[241],"MARLA.":[243],"Furthermore,":[244],"demonstrate":[246],"superiority":[248],"MARLA":[250,263],"approaches.":[254],"Finally,":[255],"provide":[257],"open-source":[259],"implementation":[260],"framework,":[264],"benefit":[267],"researchers":[269],"developers":[271],"related":[273],"domains.":[274]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
