{"id":"https://openalex.org/W3176140770","doi":"https://doi.org/10.1002/sam.11643","title":"Stratified learning: A general\u2010purpose statistical method for improved learning under covariate shift","display_name":"Stratified learning: A general\u2010purpose statistical method for improved learning under covariate shift","publication_year":2023,"publication_date":"2023-09-29","ids":{"openalex":"https://openalex.org/W3176140770","doi":"https://doi.org/10.1002/sam.11643","mag":"3176140770"},"language":"en","primary_location":{"id":"doi:10.1002/sam.11643","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1002/sam.11643","pdf_url":"https://onlinelibrary.wiley.com/doi/pdfdirect/10.1002/sam.11643","source":{"id":"https://openalex.org/S40788348","display_name":"Statistical Analysis and Data Mining The ASA Data Science Journal","issn_l":"1932-1864","issn":["1932-1864","1932-1872"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Statistical Analysis and Data Mining: The ASA Data Science Journal","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://onlinelibrary.wiley.com/doi/pdfdirect/10.1002/sam.11643","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049505436","display_name":"Maximilian Autenrieth","orcid":"https://orcid.org/0009-0006-2068-5950"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Maximilian Autenrieth","raw_affiliation_strings":["Department of Mathematics Imperial College London  London UK","Department of Mathematics, Imperial College London, London, UK"],"raw_orcid":"https://orcid.org/0009-0006-2068-5950","affiliations":[{"raw_affiliation_string":"Department of Mathematics Imperial College London  London UK","institution_ids":["https://openalex.org/I47508984"]},{"raw_affiliation_string":"Department of Mathematics, Imperial College London, London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038831857","display_name":"David A. van Dyk","orcid":"https://orcid.org/0000-0002-0816-331X"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"David A. van Dyk","raw_affiliation_strings":["Department of Mathematics Imperial College London  London UK","Department of Mathematics, Imperial College London, London, UK"],"raw_orcid":"https://orcid.org/0000-0002-0816-331X","affiliations":[{"raw_affiliation_string":"Department of Mathematics Imperial College London  London UK","institution_ids":["https://openalex.org/I47508984"]},{"raw_affiliation_string":"Department of Mathematics, Imperial College London, London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049262683","display_name":"Roberto Trotta","orcid":"https://orcid.org/0000-0002-3415-0707"},"institutions":[{"id":"https://openalex.org/I138549579","display_name":"Scuola Internazionale Superiore di Studi Avanzati","ror":"https://ror.org/004fze387","country_code":"IT","type":"education","lineage":["https://openalex.org/I138549579"]},{"id":"https://openalex.org/I3005160176","display_name":"Institute for High Performance Computing and Networking","ror":"https://ror.org/04r5fge26","country_code":"IT","type":"facility","lineage":["https://openalex.org/I3005160176","https://openalex.org/I4210155236"]},{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB","IT"],"is_corresponding":false,"raw_author_name":"Roberto Trotta","raw_affiliation_strings":["Centro Nazionale \u201cHigh Performance Computer Big Data and Quantum Computing\u201d  Italy","Department of Physics Imperial College London  London UK","Department of Physics SISSA  Trieste Italy","Department of Physics, Imperial College London, London, UK","Department of Physics, SISSA, Trieste, Italy","Centro Nazionale \"High Performance Computer Big Data and Quantum Computing\", Italy"],"raw_orcid":"https://orcid.org/0000-0002-3415-0707","affiliations":[{"raw_affiliation_string":"Centro Nazionale \u201cHigh Performance Computer Big Data and Quantum Computing\u201d  Italy","institution_ids":["https://openalex.org/I3005160176"]},{"raw_affiliation_string":"Department of Physics Imperial College London  London UK","institution_ids":["https://openalex.org/I47508984"]},{"raw_affiliation_string":"Department of Physics SISSA  Trieste Italy","institution_ids":["https://openalex.org/I138549579"]},{"raw_affiliation_string":"Department of Physics, Imperial College London, London, UK","institution_ids":["https://openalex.org/I47508984"]},{"raw_affiliation_string":"Department of Physics, SISSA, Trieste, Italy","institution_ids":["https://openalex.org/I138549579"]},{"raw_affiliation_string":"Centro Nazionale \"High Performance Computer Big Data and Quantum Computing\", Italy","institution_ids":["https://openalex.org/I3005160176"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057162774","display_name":"David C. Stenning","orcid":"https://orcid.org/0000-0002-9761-4353"},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"David C. Stenning","raw_affiliation_strings":["Department of Statistics and Actuarial Science Simon Fraser University  Burnaby British Columbia Canada","Department of Statistics and Actuarial Science, Simon Fraser University, Burnaby, British Columbia, Canada"],"raw_orcid":"https://orcid.org/0000-0002-9761-4353","affiliations":[{"raw_affiliation_string":"Department of Statistics and Actuarial Science Simon Fraser University  Burnaby British Columbia Canada","institution_ids":["https://openalex.org/I18014758"]},{"raw_affiliation_string":"Department of Statistics and Actuarial Science, Simon Fraser University, Burnaby, British Columbia, Canada","institution_ids":["https://openalex.org/I18014758"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5049505436"],"corresponding_institution_ids":["https://openalex.org/I47508984"],"apc_list":{"value":3760,"currency":"USD","value_usd":3760},"apc_paid":{"value":3760,"currency":"USD","value_usd":3760},"fwci":1.6466,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.83293519,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"17","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11871","display_name":"Advanced Statistical Methods and Models","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10243","display_name":"Statistical Methods and Bayesian Inference","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/covariate","display_name":"Covariate","score":0.924699068069458},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6306600570678711},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5850793719291687},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.5659737586975098},{"id":"https://openalex.org/keywords/causal-inference","display_name":"Causal inference","score":0.5620622038841248},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.486102819442749},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4850884675979614},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4316613972187042},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.38212478160858154},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.22751864790916443}],"concepts":[{"id":"https://openalex.org/C119043178","wikidata":"https://www.wikidata.org/wiki/Q320723","display_name":"Covariate","level":2,"score":0.924699068069458},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6306600570678711},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5850793719291687},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.5659737586975098},{"id":"https://openalex.org/C158600405","wikidata":"https://www.wikidata.org/wiki/Q5054566","display_name":"Causal inference","level":2,"score":0.5620622038841248},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.486102819442749},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4850884675979614},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4316613972187042},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.38212478160858154},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.22751864790916443},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1002/sam.11643","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1002/sam.11643","pdf_url":"https://onlinelibrary.wiley.com/doi/pdfdirect/10.1002/sam.11643","source":{"id":"https://openalex.org/S40788348","display_name":"Statistical Analysis and Data Mining The ASA Data Science Journal","issn_l":"1932-1864","issn":["1932-1864","1932-1872"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Statistical Analysis and Data Mining: The ASA Data Science Journal","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2106.11211","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2106.11211","pdf_url":"https://arxiv.org/pdf/2106.11211","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:spiral.imperial.ac.uk:10044/1/106453","is_oa":true,"landing_page_url":"http://hdl.handle.net/10044/1/106453","pdf_url":null,"source":{"id":"https://openalex.org/S4306401396","display_name":"Spiral (Imperial College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I47508984","host_organization_name":"Imperial College London","host_organization_lineage":["https://openalex.org/I47508984"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Journal Article"}],"best_oa_location":{"id":"doi:10.1002/sam.11643","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1002/sam.11643","pdf_url":"https://onlinelibrary.wiley.com/doi/pdfdirect/10.1002/sam.11643","source":{"id":"https://openalex.org/S40788348","display_name":"Statistical Analysis and Data Mining The ASA Data Science Journal","issn_l":"1932-1864","issn":["1932-1864","1932-1872"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Statistical Analysis and Data Mining: The ASA Data Science Journal","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.41999998688697815,"display_name":"No poverty","id":"https://metadata.un.org/sdg/1"}],"awards":[{"id":"https://openalex.org/G1322596814","display_name":null,"funder_award_id":"ST/P000762/1","funder_id":"https://openalex.org/F4320334632","funder_display_name":"Science and Technology Facilities Council"},{"id":"https://openalex.org/G344728634","display_name":null,"funder_award_id":"ST/T000791/1","funder_id":"https://openalex.org/F4320334632","funder_display_name":"Science and Technology Facilities Council"},{"id":"https://openalex.org/G3558974111","display_name":null,"funder_award_id":"EP/W015080/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G3619189227","display_name":null,"funder_award_id":"ST/S000372/1","funder_id":"https://openalex.org/F4320334632","funder_display_name":"Science and Technology Facilities Council"},{"id":"https://openalex.org/G5081566999","display_name":"M-Theory, Cosmology and Quantum Field Theory","funder_award_id":"ST/P000762/1","funder_id":"https://openalex.org/F4320334632","funder_display_name":"Science and Technology Facilities Council"},{"id":"https://openalex.org/G5431427016","display_name":null,"funder_award_id":"RGPIN\u20102021\u201003985","funder_id":"https://openalex.org/F4320334593","funder_display_name":"Natural Sciences and Engineering Research Council of Canada"},{"id":"https://openalex.org/G8645909849","display_name":"M-Theory, Cosmology and Quantum Field Theory","funder_award_id":"ST/T000791/1","funder_id":"https://openalex.org/F4320334632","funder_display_name":"Science and Technology Facilities Council"}],"funders":[{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"},{"id":"https://openalex.org/F4320334632","display_name":"Science and Technology Facilities Council","ror":"https://ror.org/057g20z61"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W3176140770.pdf"},"referenced_works_count":62,"referenced_works":["https://openalex.org/W189742998","https://openalex.org/W804362531","https://openalex.org/W1489126041","https://openalex.org/W1537066827","https://openalex.org/W1831050183","https://openalex.org/W1853767801","https://openalex.org/W2028040032","https://openalex.org/W2028138594","https://openalex.org/W2032536435","https://openalex.org/W2034368206","https://openalex.org/W2035404753","https://openalex.org/W2035481234","https://openalex.org/W2035956549","https://openalex.org/W2036193982","https://openalex.org/W2039232902","https://openalex.org/W2048470090","https://openalex.org/W2051554499","https://openalex.org/W2053537340","https://openalex.org/W2073832139","https://openalex.org/W2100534701","https://openalex.org/W2102689555","https://openalex.org/W2103459159","https://openalex.org/W2108018401","https://openalex.org/W2110818436","https://openalex.org/W2111078766","https://openalex.org/W2111362445","https://openalex.org/W2112483442","https://openalex.org/W2115403315","https://openalex.org/W2129092711","https://openalex.org/W2139122730","https://openalex.org/W2145550174","https://openalex.org/W2150291618","https://openalex.org/W2155982052","https://openalex.org/W2164498941","https://openalex.org/W2165698076","https://openalex.org/W2168639902","https://openalex.org/W2255883267","https://openalex.org/W2292579160","https://openalex.org/W2562469482","https://openalex.org/W2624682472","https://openalex.org/W2906986493","https://openalex.org/W2922961522","https://openalex.org/W2951810666","https://openalex.org/W2959412897","https://openalex.org/W2963271324","https://openalex.org/W2979509742","https://openalex.org/W2990138404","https://openalex.org/W3022547535","https://openalex.org/W3102681989","https://openalex.org/W3103235332","https://openalex.org/W3106384162","https://openalex.org/W3120740533","https://openalex.org/W3122193054","https://openalex.org/W3122659035","https://openalex.org/W3150893739","https://openalex.org/W4212774754","https://openalex.org/W4213367101","https://openalex.org/W4239728164","https://openalex.org/W4244364296","https://openalex.org/W4297791620","https://openalex.org/W6680521049","https://openalex.org/W6768738362"],"related_works":["https://openalex.org/W2180954594","https://openalex.org/W2052835778","https://openalex.org/W2985746494","https://openalex.org/W4206042385","https://openalex.org/W2049003611","https://openalex.org/W2511384863","https://openalex.org/W2080773131","https://openalex.org/W2096089271","https://openalex.org/W2923628599","https://openalex.org/W2905625059"],"abstract_inverted_index":{"Abstract":[0],"We":[1,28,85,97,117],"propose":[2],"a":[3,22,31],"simple,":[4],"statistically":[5],"principled,":[6],"and":[7,37,81,130],"theoretically":[8],"justified":[9],"method":[10,90,104],"to":[11,77,87],"improve":[12,132],"supervised":[13],"learning":[14],"when":[15],"the":[16,40,68,72,88,99,119,124],"training":[17],"set":[18],"is":[19,58],"not":[20],"representative,":[21],"situation":[23],"known":[24],"as":[25,91],"covariate":[26,43],"shift.":[27],"build":[29],"upon":[30,133],"well\u2010established":[32],"methodology":[33],"in":[34,110],"causal":[35],"inference":[36],"show":[38],"that":[39],"effects":[41],"of":[42,101,138],"shift":[44],"can":[45],"be":[46],"reduced":[47],"or":[48,94],"eliminated":[49],"by":[50,60,66],"conditioning":[51],"on":[52,71,105,123],"propensity":[53,74],"scores.":[54],"In":[55],"practice,":[56],"this":[57,102],"achieved":[59],"fitting":[61],"learners":[62],"within":[63],"strata":[64],"constructed":[65],"partitioning":[67],"data":[69],"based":[70],"estimated":[73],"scores,":[75],"leading":[76],"approximately":[78],"balanced":[79],"covariates":[80],"much\u2010improved":[82],"target":[83],"prediction.":[84],"refer":[86],"overall":[89],"Stratified":[92],"Learning,":[93],"StratLearn":[95],".":[96],"demonstrate":[98],"effectiveness":[100],"general\u2010purpose":[103],"two":[106],"contemporary":[107],"research":[108],"questions":[109],"cosmology,":[111],"outperforming":[112],"state\u2010of\u2010the\u2010art":[113],"importance":[114],"weighting":[115],"methods.":[116],"obtain":[118],"best\u2010reported":[120],"AUC":[121],"(0.958)":[122],"updated":[125],"\u201cSupernovae":[126],"photometric":[127],"classification":[128],"challenge,\u201d":[129],"we":[131],"existing":[134],"conditional":[135],"density":[136],"estimation":[137],"galaxy":[139],"redshift":[140],"from":[141],"Sloan":[142],"Digital":[143],"Sky":[144],"Survey":[145],"(SDSS)":[146],"data.":[147]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2021,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
