{"id":"https://openalex.org/W3012628688","doi":"https://doi.org/10.1145/3366423.3380248","title":"Adversarial Cooperative Imitation Learning for Dynamic Treatment Regimes\u2731","display_name":"Adversarial Cooperative Imitation Learning for Dynamic Treatment Regimes\u2731","publication_year":2020,"publication_date":"2020-04-20","ids":{"openalex":"https://openalex.org/W3012628688","doi":"https://doi.org/10.1145/3366423.3380248","mag":"3012628688"},"language":"en","primary_location":{"id":"doi:10.1145/3366423.3380248","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3366423.3380248","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of The Web Conference 2020","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3366423.3380248","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083964854","display_name":"Lu Wang","orcid":"https://orcid.org/0000-0002-7305-1496"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Lu Wang","raw_affiliation_strings":["East China Normal University"],"affiliations":[{"raw_affiliation_string":"East China Normal University","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103210504","display_name":"Wenchao Yu","orcid":"https://orcid.org/0000-0002-2480-448X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wenchao Yu","raw_affiliation_strings":["NEC Laboratories America Inc"],"affiliations":[{"raw_affiliation_string":"NEC Laboratories America Inc","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101434435","display_name":"Xiaofeng He","orcid":"https://orcid.org/0000-0002-6911-348X"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaofeng He","raw_affiliation_strings":["East China Normal University"],"affiliations":[{"raw_affiliation_string":"East China Normal University","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046943571","display_name":"Wei Cheng","orcid":"https://orcid.org/0000-0002-1475-4079"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei Cheng","raw_affiliation_strings":["NEC Laboratories America Inc"],"affiliations":[{"raw_affiliation_string":"NEC Laboratories America Inc","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066274469","display_name":"Martin Renqiang Ren","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Martin Renqiang Ren","raw_affiliation_strings":["NEC Laboratories America Inc"],"affiliations":[{"raw_affiliation_string":"NEC Laboratories America Inc","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100392089","display_name":"Wei Wang","orcid":"https://orcid.org/0000-0002-8180-2886"},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wei Wang","raw_affiliation_strings":["University of California Los Angeles"],"affiliations":[{"raw_affiliation_string":"University of California Los Angeles","institution_ids":["https://openalex.org/I161318765"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031597364","display_name":"Zong Bo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bo Zong","raw_affiliation_strings":["NEC Laboratories America Inc"],"affiliations":[{"raw_affiliation_string":"NEC Laboratories America Inc","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100456786","display_name":"Haifeng Chen","orcid":"https://orcid.org/0000-0002-9363-738X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haifeng Chen","raw_affiliation_strings":["NEC Laboratories America Inc"],"affiliations":[{"raw_affiliation_string":"NEC Laboratories America Inc","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046703129","display_name":"Hongyuan Zha","orcid":"https://orcid.org/0000-0001-7493-0911"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hongyuan Zha","raw_affiliation_strings":["Georgia Tech"],"affiliations":[{"raw_affiliation_string":"Georgia Tech","institution_ids":["https://openalex.org/I130701444"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5083964854"],"corresponding_institution_ids":["https://openalex.org/I66867065"],"apc_list":null,"apc_paid":null,"fwci":1.7233,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.87408691,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1785","last_page":"1795"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10845","display_name":"Advanced Causal Inference Techniques","score":0.9528999924659729,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.9473000168800354,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminator","display_name":"Discriminator","score":0.8726178407669067},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7908680438995361},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.709416389465332},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6740108728408813},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.6691991090774536},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6424164772033691},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5521730184555054},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.43018242716789246},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.19837501645088196},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.09366658329963684}],"concepts":[{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.8726178407669067},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7908680438995361},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.709416389465332},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6740108728408813},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.6691991090774536},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6424164772033691},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5521730184555054},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.43018242716789246},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.19837501645088196},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.09366658329963684},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3366423.3380248","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3366423.3380248","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of The Web Conference 2020","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3366423.3380248","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3366423.3380248","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of The Web Conference 2020","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.75}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W139596442","https://openalex.org/W1515851193","https://openalex.org/W1600046456","https://openalex.org/W1809653203","https://openalex.org/W1999874108","https://openalex.org/W2051228319","https://openalex.org/W2062525454","https://openalex.org/W2098774185","https://openalex.org/W2099471712","https://openalex.org/W2142641780","https://openalex.org/W2165612525","https://openalex.org/W2171054284","https://openalex.org/W2187089797","https://openalex.org/W2280404143","https://openalex.org/W2396881363","https://openalex.org/W2575705757","https://openalex.org/W2619989803","https://openalex.org/W2744140371","https://openalex.org/W2751444262","https://openalex.org/W2787933113","https://openalex.org/W2788125442","https://openalex.org/W2806098286","https://openalex.org/W2808915113","https://openalex.org/W2896893468","https://openalex.org/W2899259578","https://openalex.org/W2962802563","https://openalex.org/W2962957031","https://openalex.org/W2963277051","https://openalex.org/W2963328631","https://openalex.org/W2963561234","https://openalex.org/W2963590100","https://openalex.org/W2964157711","https://openalex.org/W2985962305","https://openalex.org/W3103752844"],"related_works":["https://openalex.org/W2984518291","https://openalex.org/W4221150639","https://openalex.org/W3004128202","https://openalex.org/W4320854591","https://openalex.org/W4287871966","https://openalex.org/W4382203560","https://openalex.org/W3200833855","https://openalex.org/W3046843850","https://openalex.org/W4319083788","https://openalex.org/W2952541330"],"abstract_inverted_index":{"Recent":[0],"developments":[1],"in":[2,50,71,106],"discovering":[3],"dynamic":[4,122,196,218],"treatment":[5,24,123,197,219],"regimes":[6,124,220],"(DTRs)":[7],"have":[8],"heightened":[9],"the":[10,22,31,46,96,111,120,127,133,153,156,160,163,174,178,187,193,201,210,222],"importance":[11],"of":[12,88,212,224],"deep":[13],"reinforcement":[14,51],"learning":[15,52,74,115],"(DRL)":[16],"which":[17,85],"are":[18,54,69,86,139,189],"used":[19,140,171],"to":[20,91,118,141,151,172,191],"recover":[21],"doctor\u2019s":[23],"policies.":[25],"However,":[26],"existing":[27],"DRL-based":[28],"methods":[29,36],"expose":[30],"following":[32],"limitations:":[33],"1)":[34],"supervised":[35],"based":[37],"on":[38,200],"behavior":[39],"cloning":[40],"suffer":[41],"from":[42,132,159,177,186,226],"compounding":[43],"errors;":[44],"2)":[45],"self-defined":[47],"reward":[48,184],"signals":[49,185],"models":[53],"either":[55],"too":[56],"sparse":[57],"or":[58],"need":[59],"clinical":[60],"guidance;":[61],"3)":[62],"only":[63],"positive":[64,128,164,179,228],"trajectories":[65,78,129,157,176],"(e.g.":[66,79],"survived":[67],"patients)":[68,81],"considered":[70],"current":[72],"imitation":[73,114],"models,":[75],"with":[76,221],"negative":[77,134,175,230],"deceased":[80],"been":[82],"largely":[83],"ignored,":[84],"examples":[87],"what":[89],"not":[90],"do":[92],"and":[93,162,166,180,215,229],"could":[94],"help":[95,142],"learned":[97],"policy":[98,161,194],"avoid":[99],"repeating":[100],"mistakes.":[101],"To":[102],"address":[103],"these":[104],"limitations,":[105],"this":[107,144],"paper,":[108],"we":[109],"propose":[110],"adversarial":[112,147],"cooperative":[113,168],"model,":[116],"ACIL,":[117],"deduce":[119],"optimal":[121],"that":[125,207],"mimics":[126],"while":[130],"differs":[131],"trajectories.":[135,182,231],"Specifically,":[136],"two":[137],"discriminators":[138,188],"achieve":[143],"goal:":[145],"an":[146],"discriminator":[148,169],"is":[149,170],"designed":[150],"minimize":[152],"discrepancies":[154],"between":[155],"generated":[158,181],"trajectories,":[165],"a":[167],"distinguish":[173],"The":[183],"utilized":[190],"refine":[192],"for":[195],"regimes.":[198],"Experiments":[199],"publicly":[202],"real-world":[203],"medical":[204],"data":[205],"demonstrate":[206],"ACIL":[208],"improves":[209],"likelihood":[211],"patient":[213],"survival":[214],"provides":[216],"better":[217],"exploitation":[223],"information":[225],"both":[227]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
