{"id":"https://openalex.org/W7102791019","doi":"https://doi.org/10.48550/arxiv.2510.25128","title":"An Analysis of Causal Effect Estimation using Outcome Invariant Data Augmentation","display_name":"An Analysis of Causal Effect Estimation using Outcome Invariant Data Augmentation","publication_year":2025,"publication_date":"2025-10-29","ids":{"openalex":"https://openalex.org/W7102791019","doi":"https://doi.org/10.48550/arxiv.2510.25128"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2510.25128","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Akbar, Uzair","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Akbar, Uzair","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Kilbertus, Niki","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kilbertus, Niki","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Shen, Hao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Muandet, Krikamol","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Muandet, Krikamol","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Dai, Bo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dai, Bo","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T10845","display_name":"Advanced Causal Inference Techniques","score":0.9821000099182129,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10845","display_name":"Advanced Causal Inference Techniques","score":0.9821000099182129,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.005200000014156103,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.0019000000320374966,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/causal-inference","display_name":"Causal inference","score":0.7282999753952026},{"id":"https://openalex.org/keywords/instrumental-variable","display_name":"Instrumental variable","score":0.5659000277519226},{"id":"https://openalex.org/keywords/confounding","display_name":"Confounding","score":0.5295000076293945},{"id":"https://openalex.org/keywords/outcome","display_name":"Outcome (game theory)","score":0.505299985408783},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.4941999912261963},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.49399998784065247},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4830999970436096},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.45570001006126404},{"id":"https://openalex.org/keywords/causal-model","display_name":"Causal model","score":0.44369998574256897},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.41830000281333923}],"concepts":[{"id":"https://openalex.org/C158600405","wikidata":"https://www.wikidata.org/wiki/Q5054566","display_name":"Causal inference","level":2,"score":0.7282999753952026},{"id":"https://openalex.org/C162144332","wikidata":"https://www.wikidata.org/wiki/Q1665305","display_name":"Instrumental variable","level":2,"score":0.5659000277519226},{"id":"https://openalex.org/C77350462","wikidata":"https://www.wikidata.org/wiki/Q1125472","display_name":"Confounding","level":2,"score":0.5295000076293945},{"id":"https://openalex.org/C148220186","wikidata":"https://www.wikidata.org/wiki/Q7111912","display_name":"Outcome (game theory)","level":2,"score":0.505299985408783},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.49709999561309814},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.4941999912261963},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.49399998784065247},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4830999970436096},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.47510001063346863},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.45570001006126404},{"id":"https://openalex.org/C11671645","wikidata":"https://www.wikidata.org/wiki/Q5054567","display_name":"Causal model","level":2,"score":0.44369998574256897},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.43470001220703125},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4287000000476837},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.41830000281333923},{"id":"https://openalex.org/C165464430","wikidata":"https://www.wikidata.org/wiki/Q1570441","display_name":"Parameterized complexity","level":2,"score":0.399399995803833},{"id":"https://openalex.org/C190470478","wikidata":"https://www.wikidata.org/wiki/Q2370229","display_name":"Invariant (physics)","level":2,"score":0.3547999858856201},{"id":"https://openalex.org/C129848803","wikidata":"https://www.wikidata.org/wiki/Q2564360","display_name":"Sample size determination","level":2,"score":0.3450999855995178},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.3375999927520752},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.336899995803833},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3255000114440918},{"id":"https://openalex.org/C163504300","wikidata":"https://www.wikidata.org/wiki/Q2364925","display_name":"Causal structure","level":2,"score":0.32330000400543213},{"id":"https://openalex.org/C117765406","wikidata":"https://www.wikidata.org/wiki/Q5362437","display_name":"Generalization error","level":3,"score":0.3181999921798706},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.31529998779296875},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.29980000853538513},{"id":"https://openalex.org/C89337504","wikidata":"https://www.wikidata.org/wiki/Q4828276","display_name":"Average treatment effect","level":3,"score":0.2948000133037567},{"id":"https://openalex.org/C64357122","wikidata":"https://www.wikidata.org/wiki/Q1149766","display_name":"Causality (physics)","level":2,"score":0.2915000021457672},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.29100000858306885},{"id":"https://openalex.org/C27415008","wikidata":"https://www.wikidata.org/wiki/Q7256382","display_name":"Psychological intervention","level":2,"score":0.28780001401901245},{"id":"https://openalex.org/C155108698","wikidata":"https://www.wikidata.org/wiki/Q1231081","display_name":"Randomized experiment","level":2,"score":0.2799000144004822},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.2797999978065491},{"id":"https://openalex.org/C163175372","wikidata":"https://www.wikidata.org/wiki/Q3339222","display_name":"Linear model","level":2,"score":0.2784999907016754},{"id":"https://openalex.org/C134261354","wikidata":"https://www.wikidata.org/wiki/Q938438","display_name":"Statistical inference","level":2,"score":0.27399998903274536},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2696000039577484},{"id":"https://openalex.org/C182365436","wikidata":"https://www.wikidata.org/wiki/Q50701","display_name":"Variable (mathematics)","level":2,"score":0.2678999900817871},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.2549000084400177},{"id":"https://openalex.org/C27574286","wikidata":"https://www.wikidata.org/wiki/Q320723","display_name":"Variables","level":2,"score":0.25450000166893005},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.25450000166893005},{"id":"https://openalex.org/C40423286","wikidata":"https://www.wikidata.org/wiki/Q284172","display_name":"Selection bias","level":2,"score":0.2531000077724457}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2510.25128","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2510.25128","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.25128","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2510.25128","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"technique":[1],"of":[2,41,69,78,105,113,119,126,160,203],"data":[3,248],"augmentation":[4],"(DA)":[5],"is":[6,64,143,222],"often":[7],"used":[8,195],"in":[9,31,94,196],"machine":[10],"learning":[11],"for":[12,38,49,139,164,226,234],"regularization":[13],"purposes":[14],"to":[15,34,66,91,250],"better":[16],"generalize":[17],"under":[18],"i.i.d.":[19,46],"settings.":[20],"In":[21,102],"this":[22,148],"work,":[23],"we":[24,56,109,156,182],"present":[25,246],"a":[26,36,200,240],"unifying":[27],"framework":[28],"with":[29],"topics":[30],"causal":[32,95,210],"inference":[33],"make":[35,111],"case":[37,229,238],"the":[39,45,60,82,103,127,144,158,227,235],"use":[40,112],"DA":[42,138,185,218],"beyond":[43,215],"just":[44],"setting,":[47],"but":[48],"generalization":[50,213],"across":[51,172],"interventions":[52,80,173],"as":[53,79,134,137,186],"well.":[54],"Specifically,":[55],"argue":[57],"that":[58,122,193],"when":[59,175,194],"outcome":[61],"generating":[62,84],"mechanism":[63,85],"invariant":[65],"our":[67,252],"choice":[68],"DA,":[70,205],"then":[71],"such":[72,106,204],"augmentations":[73],"can":[74,88,198],"effectively":[75],"be":[76,133],"thought":[77],"on":[81,209],"treatment":[83,120],"itself.":[86],"This":[87,221],"potentially":[89],"help":[90],"reduce":[92],"bias":[93,167],"effect":[96],"estimation":[97,211],"arising":[98],"from":[99],"hidden":[100],"confounders.":[101],"presence":[104],"unobserved":[107],"confounding":[108,166],"typically":[110],"instrumental":[114],"variables":[115],"(IVs)":[116],"--":[117],"sources":[118],"randomization":[121],"are":[123,179],"conditionally":[124],"independent":[125],"outcome.":[128],"However,":[129],"IVs":[130],"may":[131,219],"not":[132],"readily":[135],"available":[136],"many":[140],"applications,":[141],"which":[142],"main":[145],"motivation":[146],"behind":[147],"work.":[149],"By":[150],"appropriately":[151],"regularizing":[152],"IV":[153,177],"based":[154],"estimators,":[155],"introduce":[157],"concept":[159],"IV-like":[161],"(IVL)":[162],"regression":[163,189],"mitigating":[165],"and":[168,191,212,230],"improving":[169,207],"predictive":[170],"performance":[171,208],"even":[174],"certain":[176],"properties":[178],"relaxed.":[180],"Finally,":[181],"cast":[183],"parameterized":[184],"an":[187],"IVL":[188],"problem":[190],"show":[192],"composition":[197],"simulate":[199],"worst-case":[201],"application":[202],"further":[206],"tasks":[214],"what":[216],"simple":[217,241],"offer.":[220],"shown":[223],"both":[224],"theoretically":[225],"population":[228],"via":[231],"simulation":[232],"experiments":[233,249],"finite":[236],"sample":[237],"using":[239],"linear":[242],"example.":[243],"We":[244],"also":[245],"real":[247],"support":[251],"case.":[253]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-31T00:00:00"}
