{"id":"https://openalex.org/W3169424162","doi":"https://doi.org/10.1109/tpami.2022.3232363","title":"Invariant Policy Learning: A Causal Perspective","display_name":"Invariant Policy Learning: A Causal Perspective","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W3169424162","doi":"https://doi.org/10.1109/tpami.2022.3232363","mag":"3169424162","pmid":"https://pubmed.ncbi.nlm.nih.gov/37018267"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2022.3232363","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2022.3232363","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://curis.ku.dk/ws/files/374467912/Invariant_Policy_Learning.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052823119","display_name":"Sorawit Saengkyongam","orcid":"https://orcid.org/0000-0003-1581-259X"},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Sorawit Saengkyongam","raw_affiliation_strings":["Department of Mathematical Sciences, University of Copenhagen, Denmark","Department of Mathematical Sciences, University of Copenhagen, Copenhagen, Denmark"],"raw_orcid":"https://orcid.org/0000-0003-1581-259X","affiliations":[{"raw_affiliation_string":"Department of Mathematical Sciences, University of Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]},{"raw_affiliation_string":"Department of Mathematical Sciences, University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040183934","display_name":"Nikolaj Thams","orcid":"https://orcid.org/0000-0003-3961-5101"},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Nikolaj Thams","raw_affiliation_strings":["Department of Mathematical Sciences, University of Copenhagen, Denmark","Department of Mathematical Sciences, University of Copenhagen, Copenhagen, Denmark"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Mathematical Sciences, University of Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]},{"raw_affiliation_string":"Department of Mathematical Sciences, University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002127148","display_name":"Jonas Peters","orcid":"https://orcid.org/0000-0002-1487-7511"},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Jonas Peters","raw_affiliation_strings":["Department of Mathematical Sciences, University of Copenhagen, Denmark","Department of Mathematical Sciences, University of Copenhagen, Copenhagen, Denmark"],"raw_orcid":"https://orcid.org/0000-0002-1487-7511","affiliations":[{"raw_affiliation_string":"Department of Mathematical Sciences, University of Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]},{"raw_affiliation_string":"Department of Mathematical Sciences, University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044701034","display_name":"Niklas Pfister","orcid":"https://orcid.org/0000-0001-6203-9777"},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Niklas Pfister","raw_affiliation_strings":["Department of Mathematical Sciences, University of Copenhagen, Denmark","Department of Mathematical Sciences, University of Copenhagen, Copenhagen, Denmark"],"raw_orcid":"https://orcid.org/0000-0001-6203-9777","affiliations":[{"raw_affiliation_string":"Department of Mathematical Sciences, University of Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]},{"raw_affiliation_string":"Department of Mathematical Sciences, University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.6522,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.83854593,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"45","issue":"7","first_page":"1","last_page":"15"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9846000075340271,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.980400025844574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7348409295082092},{"id":"https://openalex.org/keywords/invariant","display_name":"Invariant (physics)","score":0.6589385271072388},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6573281288146973},{"id":"https://openalex.org/keywords/causality","display_name":"Causality (physics)","score":0.5766108632087708},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.5733359456062317},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5458914637565613},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3969517946243286},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3274298906326294},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.13497766852378845}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7348409295082092},{"id":"https://openalex.org/C190470478","wikidata":"https://www.wikidata.org/wiki/Q2370229","display_name":"Invariant (physics)","level":2,"score":0.6589385271072388},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6573281288146973},{"id":"https://openalex.org/C64357122","wikidata":"https://www.wikidata.org/wiki/Q1149766","display_name":"Causality (physics)","level":2,"score":0.5766108632087708},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.5733359456062317},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5458914637565613},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3969517946243286},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3274298906326294},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13497766852378845},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tpami.2022.3232363","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2022.3232363","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:37018267","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37018267","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null},{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/a440e450-e9a1-4243-af50-61b5ad147089","is_oa":true,"landing_page_url":"https://researchprofiles.ku.dk/da/publications/a440e450-e9a1-4243-af50-61b5ad147089","pdf_url":"https://curis.ku.dk/ws/files/374467912/Invariant_Policy_Learning.pdf","source":{"id":"https://openalex.org/S4306401983","display_name":"Research at the University of Copenhagen (University of Copenhagen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I124055696","host_organization_name":"University of Copenhagen","host_organization_lineage":["https://openalex.org/I124055696"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Saengkyongam , S , Thams , N , Peters , J & Pfister , N 2023 , ' Invariant Policy Learning : A Causal Perspective ' , IEEE Transactions on Pattern Analysis and Machine Intelligence , vol. 45 , no. 7 , pp. 8606-8620 . https://doi.org/10.1109/TPAMI.2022.3232363","raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/a440e450-e9a1-4243-af50-61b5ad147089","is_oa":true,"landing_page_url":"https://researchprofiles.ku.dk/da/publications/a440e450-e9a1-4243-af50-61b5ad147089","pdf_url":"https://curis.ku.dk/ws/files/374467912/Invariant_Policy_Learning.pdf","source":{"id":"https://openalex.org/S4306401983","display_name":"Research at the University of Copenhagen (University of Copenhagen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I124055696","host_organization_name":"University of Copenhagen","host_organization_lineage":["https://openalex.org/I124055696"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Saengkyongam , S , Thams , N , Peters , J & Pfister , N 2023 , ' Invariant Policy Learning : A Causal Perspective ' , IEEE Transactions on Pattern Analysis and Machine Intelligence , vol. 45 , no. 7 , pp. 8606-8620 . https://doi.org/10.1109/TPAMI.2022.3232363","raw_type":"article"},"sustainable_development_goals":[{"score":0.4699999988079071,"id":"https://metadata.un.org/sdg/15","display_name":"Life in Land"}],"awards":[{"id":"https://openalex.org/G3077033437","display_name":null,"funder_award_id":"0069071","funder_id":"https://openalex.org/F4320325957","funder_display_name":"Novo Nordisk Fonden"},{"id":"https://openalex.org/G711721537","display_name":null,"funder_award_id":"18968","funder_id":"https://openalex.org/F4320310490","funder_display_name":"Villum Fonden"}],"funders":[{"id":"https://openalex.org/F4320310490","display_name":"Villum Fonden","ror":"https://ror.org/007ww2d15"},{"id":"https://openalex.org/F4320322436","display_name":"Novo Nordisk","ror":"https://ror.org/0435rc536"},{"id":"https://openalex.org/F4320325957","display_name":"Novo Nordisk Fonden","ror":"https://ror.org/04txyc737"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3169424162.pdf","grobid_xml":"https://content.openalex.org/works/W3169424162.grobid-xml"},"referenced_works_count":132,"referenced_works":["https://openalex.org/W1511751337","https://openalex.org/W1515782956","https://openalex.org/W1524326598","https://openalex.org/W1554015367","https://openalex.org/W1845972764","https://openalex.org/W1899161704","https://openalex.org/W2013567125","https://openalex.org/W2020160576","https://openalex.org/W2041282815","https://openalex.org/W2049910836","https://openalex.org/W2061554433","https://openalex.org/W2079062180","https://openalex.org/W2091825929","https://openalex.org/W2099471337","https://openalex.org/W2105897901","https://openalex.org/W2113065326","https://openalex.org/W2119850747","https://openalex.org/W2122124659","https://openalex.org/W2134779831","https://openalex.org/W2135046866","https://openalex.org/W2143891888","https://openalex.org/W2144020560","https://openalex.org/W2155858138","https://openalex.org/W2169315100","https://openalex.org/W2170400507","https://openalex.org/W2184746314","https://openalex.org/W2188353343","https://openalex.org/W2212660284","https://openalex.org/W2280421545","https://openalex.org/W2462906003","https://openalex.org/W2466989778","https://openalex.org/W2486285194","https://openalex.org/W2620289825","https://openalex.org/W2787023317","https://openalex.org/W2790376986","https://openalex.org/W2801890059","https://openalex.org/W2804232618","https://openalex.org/W2806187986","https://openalex.org/W2807644309","https://openalex.org/W2878791470","https://openalex.org/W2885305518","https://openalex.org/W2891404994","https://openalex.org/W2891620446","https://openalex.org/W2891765548","https://openalex.org/W2911964244","https://openalex.org/W2948579453","https://openalex.org/W2949367566","https://openalex.org/W2952428244","https://openalex.org/W2953494151","https://openalex.org/W2962736281","https://openalex.org/W2962875036","https://openalex.org/W2962935454","https://openalex.org/W2963062793","https://openalex.org/W2963448230","https://openalex.org/W2963608118","https://openalex.org/W2964250062","https://openalex.org/W2964297722","https://openalex.org/W2964311196","https://openalex.org/W2990645394","https://openalex.org/W2997261067","https://openalex.org/W2998548529","https://openalex.org/W3005930619","https://openalex.org/W3010488986","https://openalex.org/W3011651653","https://openalex.org/W3016824580","https://openalex.org/W3021834848","https://openalex.org/W3023021572","https://openalex.org/W3029947299","https://openalex.org/W3034932139","https://openalex.org/W3037700572","https://openalex.org/W3083684531","https://openalex.org/W3085744854","https://openalex.org/W3098163125","https://openalex.org/W3105003902","https://openalex.org/W3119520891","https://openalex.org/W3125697501","https://openalex.org/W3125774186","https://openalex.org/W3165503008","https://openalex.org/W3166322349","https://openalex.org/W3167514074","https://openalex.org/W3174040277","https://openalex.org/W3176138766","https://openalex.org/W3179971958","https://openalex.org/W3191453585","https://openalex.org/W3201699076","https://openalex.org/W3202150619","https://openalex.org/W3214040448","https://openalex.org/W4225659962","https://openalex.org/W4244473079","https://openalex.org/W4247128285","https://openalex.org/W4287178247","https://openalex.org/W4288287305","https://openalex.org/W4294016603","https://openalex.org/W4302423442","https://openalex.org/W6633172667","https://openalex.org/W6638280738","https://openalex.org/W6639610613","https://openalex.org/W6675240855","https://openalex.org/W6675601395","https://openalex.org/W6677102192","https://openalex.org/W6678113768","https://openalex.org/W6678276431","https://openalex.org/W6680096503","https://openalex.org/W6682789603","https://openalex.org/W6683124652","https://openalex.org/W6686823217","https://openalex.org/W6687328806","https://openalex.org/W6688325169","https://openalex.org/W6716227286","https://openalex.org/W6718836005","https://openalex.org/W6728912306","https://openalex.org/W6738737708","https://openalex.org/W6747999063","https://openalex.org/W6752160200","https://openalex.org/W6752252196","https://openalex.org/W6753717593","https://openalex.org/W6754586084","https://openalex.org/W6754927192","https://openalex.org/W6755551399","https://openalex.org/W6756923131","https://openalex.org/W6765285020","https://openalex.org/W6774121513","https://openalex.org/W6774858212","https://openalex.org/W6778306200","https://openalex.org/W6780260426","https://openalex.org/W6785383332","https://openalex.org/W6786117773","https://openalex.org/W6791482400","https://openalex.org/W6795862454","https://openalex.org/W6796681344","https://openalex.org/W6799730904","https://openalex.org/W6811080774"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W2018871932","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W3084456289","https://openalex.org/W2081494945","https://openalex.org/W2389053294","https://openalex.org/W641279757"],"abstract_inverted_index":{"Contextual":[0],"bandit":[1],"and":[2,21,116,139,159],"reinforcement":[3],"learning":[4,13],"algorithms":[5],"have":[6,26],"been":[7],"successfully":[8],"used":[9],"in":[10,32,53,125,162],"various":[11],"interactive":[12],"systems":[14],"such":[15,36],"as":[16,37],"online":[17],"advertising,":[18],"recommender":[19],"systems,":[20,67],"dynamic":[22],"pricing.":[23],"However,":[24],"they":[25,57],"yet":[27],"to":[28,73,171],"be":[29,42],"widely":[30],"adopted":[31],"high-stakes":[33],"application":[34],"domains,":[35],"healthcare.":[38],"One":[39],"reason":[40],"may":[41,78],"that":[43,47,56,121,148,163],"existing":[44],"approaches":[45],"assume":[46],"the":[48,54,69,80,93,99,107,112,126,131,136,141],"underlying":[49,127],"mechanisms":[50,70],"are":[51,71,157],"static":[52,81],"sense":[55],"do":[58],"not":[59],"change":[60],"over":[61],"different":[62],"environments.":[63],"In":[64,84],"many":[65],"real-world":[66],"however,":[68],"subject":[72],"shifts":[74,97],"across":[75,173],"environments":[76,174],"which":[77],"invalidate":[79],"environment":[82],"assumption.":[83],"this":[85],"paper,":[86],"we":[87],"take":[88],"a":[89],"step":[90],"toward":[91],"tackling":[92],"problem":[94,110],"of":[95,101,114,133,143],"environmental":[96,108],"considering":[98],"framework":[100],"offline":[102],"contextual":[103,119],"bandits.":[104],"We":[105,129,146],"view":[106],"shift":[109],"through":[111],"lens":[113],"causality":[115,137],"propose":[117],"multi-environment":[118],"bandits":[120],"allow":[122],"for":[123],"changes":[124],"mechanisms.":[128],"adopt":[130],"concept":[132],"invariance":[134,150],"from":[135],"literature":[138],"introduce":[140],"notion":[142],"policy":[144,149,168],"invariance.":[145],"argue":[147],"is":[151,169],"only":[152],"relevant":[153],"if":[154],"unobserved":[155],"variables":[156],"present":[158],"show":[160],"that,":[161],"case,":[164],"an":[165],"optimal":[166],"invariant":[167],"guaranteed":[170],"generalize":[172],"under":[175],"suitable":[176],"assumptions.":[177]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
