{"id":"https://openalex.org/W4318719233","doi":"https://doi.org/10.48550/arxiv.2301.12802","title":"Planning Multiple Epidemic Interventions with Reinforcement Learning","display_name":"Planning Multiple Epidemic Interventions with Reinforcement Learning","publication_year":2023,"publication_date":"2023-01-30","ids":{"openalex":"https://openalex.org/W4318719233","doi":"https://doi.org/10.48550/arxiv.2301.12802"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2301.12802","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2301.12802","pdf_url":"https://arxiv.org/pdf/2301.12802","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2301.12802","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058307425","display_name":"Anh Mai","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Mai, Anh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100311114","display_name":"Nikunj Gupta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gupta, Nikunj","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044418740","display_name":"Azza Abouzied","orcid":"https://orcid.org/0000-0003-4273-2536"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abouzied, Azza","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5055576104","display_name":"Dennis Shasha","orcid":"https://orcid.org/0000-0002-7036-3312"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shasha, Dennis","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5058307425"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10410","display_name":"COVID-19 epidemiological studies","score":0.8689000010490417,"subfield":{"id":"https://openalex.org/subfields/2611","display_name":"Modeling and Simulation"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10410","display_name":"COVID-19 epidemiological studies","score":0.8689000010490417,"subfield":{"id":"https://openalex.org/subfields/2611","display_name":"Modeling and Simulation"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11810","display_name":"Complex Systems and Decision Making","score":0.8489000201225281,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10804","display_name":"Health Systems, Economic Evaluations, Quality of Life","score":0.805899977684021,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7842473983764648},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.7550264596939087},{"id":"https://openalex.org/keywords/psychological-intervention","display_name":"Psychological intervention","score":0.722065806388855},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6191018223762512},{"id":"https://openalex.org/keywords/state-space","display_name":"State space","score":0.570482075214386},{"id":"https://openalex.org/keywords/plan","display_name":"Plan (archaeology)","score":0.4996161460876465},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4744109809398651},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4697212278842926},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.39449137449264526},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3792378306388855},{"id":"https://openalex.org/keywords/management-science","display_name":"Management science","score":0.3771608769893646},{"id":"https://openalex.org/keywords/risk-analysis","display_name":"Risk analysis (engineering)","score":0.3687335252761841},{"id":"https://openalex.org/keywords/operations-research","display_name":"Operations research","score":0.3517674207687378},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3443702459335327},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33001792430877686},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.17508721351623535},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1312527060508728},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.12047064304351807},{"id":"https://openalex.org/keywords/nursing","display_name":"Nursing","score":0.08489015698432922}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7842473983764648},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.7550264596939087},{"id":"https://openalex.org/C27415008","wikidata":"https://www.wikidata.org/wiki/Q7256382","display_name":"Psychological intervention","level":2,"score":0.722065806388855},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6191018223762512},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.570482075214386},{"id":"https://openalex.org/C2776505523","wikidata":"https://www.wikidata.org/wiki/Q4785468","display_name":"Plan (archaeology)","level":2,"score":0.4996161460876465},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4744109809398651},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4697212278842926},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.39449137449264526},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3792378306388855},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.3771608769893646},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.3687335252761841},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.3517674207687378},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3443702459335327},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33001792430877686},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.17508721351623535},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1312527060508728},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.12047064304351807},{"id":"https://openalex.org/C159110408","wikidata":"https://www.wikidata.org/wiki/Q121176","display_name":"Nursing","level":1,"score":0.08489015698432922},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2301.12802","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2301.12802","pdf_url":"https://arxiv.org/pdf/2301.12802","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2301.12802","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2301.12802","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2301.12802","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2301.12802","pdf_url":"https://arxiv.org/pdf/2301.12802","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"score":0.8199999928474426,"id":"https://metadata.un.org/sdg/3","display_name":"Good health and well-being"}],"awards":[{"id":"https://openalex.org/G3288531224","display_name":null,"funder_award_id":"CG001","funder_id":"https://openalex.org/F4320330069","funder_display_name":"Tamkeen"},{"id":"https://openalex.org/G8833531855","display_name":null,"funder_award_id":"CG001","funder_id":"https://openalex.org/F4320313203","funder_display_name":"New York University Abu Dhabi"},{"id":"https://openalex.org/G974757083","display_name":null,"funder_award_id":"Tamkeen","funder_id":"https://openalex.org/F4320313203","funder_display_name":"New York University Abu Dhabi"}],"funders":[{"id":"https://openalex.org/F4320313203","display_name":"New York University Abu Dhabi","ror":"https://ror.org/00e5k0821"},{"id":"https://openalex.org/F4320330069","display_name":"Tamkeen","ror":null}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4318719233.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3096874164","https://openalex.org/W1985560493","https://openalex.org/W2937181779","https://openalex.org/W2386410636","https://openalex.org/W2357975469","https://openalex.org/W2145363145","https://openalex.org/W1626977535","https://openalex.org/W2341346307","https://openalex.org/W3168977894","https://openalex.org/W4225571923"],"abstract_inverted_index":{"Combating":[0],"an":[1,30,43,47],"epidemic":[2,31],"entails":[3],"finding":[4],"a":[5,80,87,99,178],"plan":[6,27,45],"that":[7,61,67,142,162],"describes":[8],"when":[9,74],"and":[10,39,70,82,89,136,155],"how":[11,126],"to":[12,110,127,138,159,181],"apply":[13,129],"different":[14],"interventions,":[15],"such":[16],"as":[17,98],"mask-wearing":[18],"mandates,":[19],"vaccinations,":[20],"school":[21],"or":[22],"workplace":[23],"closures.":[24],"An":[25],"optimal":[26,44],"will":[28],"curb":[29],"with":[32],"minimal":[33],"loss":[34],"of":[35,152,177],"life,":[36],"disease":[37,69,117],"burden,":[38],"economic":[40,71],"cost.":[41],"Finding":[42],"is":[46,105],"intractable":[48],"computational":[49,179],"problem":[50,97],"in":[51,107],"realistic":[52],"settings.":[53],"Policy-makers,":[54],"however,":[55],"would":[56],"greatly":[57],"benefit":[58],"from":[59],"tools":[60],"can":[62],"efficiently":[63],"search":[64,139],"for":[65,140],"plans":[66,141,164],"minimize":[68,143],"costs":[72],"especially":[73],"considering":[75],"multiple":[76,112],"possible":[77],"interventions":[78,114],"over":[79,115],"continuous":[81,88,113],"complex":[83,91],"action":[84],"space":[85],"given":[86],"equally":[90],"state":[92],"space.":[93],"We":[94,124,146],"formulate":[95],"this":[96],"Markov":[100],"decision":[101],"process.":[102],"Our":[103,168,172],"formulation":[104],"unique":[106],"its":[108],"ability":[109],"represent":[111],"any":[116],"model":[118],"defined":[119],"by":[120,166],"ordinary":[121],"differential":[122],"equations.":[123],"illustrate":[125],"effectively":[128],"state-of-the-art":[130],"actor-critic":[131],"reinforcement":[132],"learning":[133,150],"algorithms":[134,154],"(PPO":[135],"SAC)":[137],"overall":[144],"costs.":[145],"empirically":[147],"evaluate":[148],"the":[149,175],"performance":[151,158],"these":[153],"compare":[156],"their":[157],"hand-crafted":[160],"baselines":[161],"mimic":[163],"constructed":[165],"policy-makers.":[167],"method":[169],"outperforms":[170],"baselines.":[171],"work":[173],"confirms":[174],"viability":[176],"approach":[180],"support":[182],"policy-makers":[183]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
