{"id":"https://openalex.org/W2794194662","doi":"https://doi.org/10.1080/03610918.2018.1433844","title":"The pitfall of instrumental variables in big data: What the rule of thumb can't give you","display_name":"The pitfall of instrumental variables in big data: What the rule of thumb can't give you","publication_year":2018,"publication_date":"2018-02-12","ids":{"openalex":"https://openalex.org/W2794194662","doi":"https://doi.org/10.1080/03610918.2018.1433844","mag":"2794194662"},"language":"en","primary_location":{"id":"doi:10.1080/03610918.2018.1433844","is_oa":false,"landing_page_url":"https://doi.org/10.1080/03610918.2018.1433844","pdf_url":null,"source":{"id":"https://openalex.org/S153329750","display_name":"Communications in Statistics - Simulation and Computation","issn_l":"0361-0918","issn":["0361-0918","1532-4141"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Statistics - Simulation and Computation","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079095481","display_name":"Hui Shao","orcid":"https://orcid.org/0000-0002-4088-546X"},"institutions":[{"id":"https://openalex.org/I114832834","display_name":"Tulane University","ror":"https://ror.org/04vmvtb21","country_code":"US","type":"education","lineage":["https://openalex.org/I114832834"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hui Shao","raw_affiliation_strings":["Tulane University Department of Global Health Management and Policy, Louisiana, New Orleans, United States"],"affiliations":[{"raw_affiliation_string":"Tulane University Department of Global Health Management and Policy, Louisiana, New Orleans, United States","institution_ids":["https://openalex.org/I114832834"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008746595","display_name":"Charles Stoecker","orcid":"https://orcid.org/0000-0001-5438-9312"},"institutions":[{"id":"https://openalex.org/I114832834","display_name":"Tulane University","ror":"https://ror.org/04vmvtb21","country_code":"US","type":"education","lineage":["https://openalex.org/I114832834"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Charles Stoecker","raw_affiliation_strings":["Tulane University Department of Global Health Management and Policy, Louisiana, New Orleans, United States"],"affiliations":[{"raw_affiliation_string":"Tulane University Department of Global Health Management and Policy, Louisiana, New Orleans, United States","institution_ids":["https://openalex.org/I114832834"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101662379","display_name":"Shuang Yang","orcid":"https://orcid.org/0000-0003-0714-2856"},"institutions":[{"id":"https://openalex.org/I114832834","display_name":"Tulane University","ror":"https://ror.org/04vmvtb21","country_code":"US","type":"education","lineage":["https://openalex.org/I114832834"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shuang Yang","raw_affiliation_strings":["Tulane University Department of Global Health Management and Policy, Louisiana, New Orleans, United States"],"affiliations":[{"raw_affiliation_string":"Tulane University Department of Global Health Management and Policy, Louisiana, New Orleans, United States","institution_ids":["https://openalex.org/I114832834"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069523303","display_name":"Lizheng Shi","orcid":"https://orcid.org/0000-0002-7827-6766"},"institutions":[{"id":"https://openalex.org/I114832834","display_name":"Tulane University","ror":"https://ror.org/04vmvtb21","country_code":"US","type":"education","lineage":["https://openalex.org/I114832834"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Lizheng Shi","raw_affiliation_strings":["Tulane University Department of Global Health Management and Policy, Louisiana, New Orleans, United States"],"affiliations":[{"raw_affiliation_string":"Tulane University Department of Global Health Management and Policy, Louisiana, New Orleans, United States","institution_ids":["https://openalex.org/I114832834"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5069523303"],"corresponding_institution_ids":["https://openalex.org/I114832834"],"apc_list":null,"apc_paid":null,"fwci":0.3431,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.50111612,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":93},"biblio":{"volume":"48","issue":"7","first_page":"2118","last_page":"2124"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13487","display_name":"Statistical and numerical algorithms","score":0.9599000215530396,"subfield":{"id":"https://openalex.org/subfields/2604","display_name":"Applied Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13487","display_name":"Statistical and numerical algorithms","score":0.9599000215530396,"subfield":{"id":"https://openalex.org/subfields/2604","display_name":"Applied Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11918","display_name":"Forecasting Techniques and Applications","score":0.9528999924659729,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11871","display_name":"Advanced Statistical Methods and Models","score":0.9433000087738037,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rule-of-thumb","display_name":"Rule of thumb","score":0.7782361507415771},{"id":"https://openalex.org/keywords/instrumental-variable","display_name":"Instrumental variable","score":0.7361636161804199},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.6372488737106323},{"id":"https://openalex.org/keywords/null-hypothesis","display_name":"Null hypothesis","score":0.5568404197692871},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.536481499671936},{"id":"https://openalex.org/keywords/statistic","display_name":"Statistic","score":0.5038298964500427},{"id":"https://openalex.org/keywords/multiple-comparisons-problem","display_name":"Multiple comparisons problem","score":0.4990510940551758},{"id":"https://openalex.org/keywords/test-statistic","display_name":"Test statistic","score":0.48345503211021423},{"id":"https://openalex.org/keywords/econometrics","display_name":"Econometrics","score":0.47532063722610474},{"id":"https://openalex.org/keywords/type-i-and-type-ii-errors","display_name":"Type I and type II errors","score":0.46252474188804626},{"id":"https://openalex.org/keywords/monte-carlo-method","display_name":"Monte Carlo method","score":0.45540153980255127},{"id":"https://openalex.org/keywords/point-estimation","display_name":"Point estimation","score":0.43131306767463684},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4281829595565796},{"id":"https://openalex.org/keywords/statistical-hypothesis-testing","display_name":"Statistical hypothesis testing","score":0.42036139965057373},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4117926359176636},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.2850004732608795},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.25963494181632996}],"concepts":[{"id":"https://openalex.org/C89246107","wikidata":"https://www.wikidata.org/wiki/Q1398821","display_name":"Rule of thumb","level":2,"score":0.7782361507415771},{"id":"https://openalex.org/C162144332","wikidata":"https://www.wikidata.org/wiki/Q1665305","display_name":"Instrumental variable","level":2,"score":0.7361636161804199},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.6372488737106323},{"id":"https://openalex.org/C191988596","wikidata":"https://www.wikidata.org/wiki/Q628374","display_name":"Null hypothesis","level":2,"score":0.5568404197692871},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.536481499671936},{"id":"https://openalex.org/C89128539","wikidata":"https://www.wikidata.org/wiki/Q1949963","display_name":"Statistic","level":2,"score":0.5038298964500427},{"id":"https://openalex.org/C183905921","wikidata":"https://www.wikidata.org/wiki/Q1038757","display_name":"Multiple comparisons problem","level":2,"score":0.4990510940551758},{"id":"https://openalex.org/C169857963","wikidata":"https://www.wikidata.org/wiki/Q1461038","display_name":"Test statistic","level":3,"score":0.48345503211021423},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.47532063722610474},{"id":"https://openalex.org/C40696583","wikidata":"https://www.wikidata.org/wiki/Q989120","display_name":"Type I and type II errors","level":2,"score":0.46252474188804626},{"id":"https://openalex.org/C19499675","wikidata":"https://www.wikidata.org/wiki/Q232207","display_name":"Monte Carlo method","level":2,"score":0.45540153980255127},{"id":"https://openalex.org/C41426520","wikidata":"https://www.wikidata.org/wiki/Q1192065","display_name":"Point estimation","level":2,"score":0.43131306767463684},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4281829595565796},{"id":"https://openalex.org/C87007009","wikidata":"https://www.wikidata.org/wiki/Q210832","display_name":"Statistical hypothesis testing","level":2,"score":0.42036139965057373},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4117926359176636},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.2850004732608795},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.25963494181632996},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1080/03610918.2018.1433844","is_oa":false,"landing_page_url":"https://doi.org/10.1080/03610918.2018.1433844","pdf_url":null,"source":{"id":"https://openalex.org/S153329750","display_name":"Communications in Statistics - Simulation and Computation","issn_l":"0361-0918","issn":["0361-0918","1532-4141"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Statistics - Simulation and Computation","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.4699999988079071}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W154531455","https://openalex.org/W2113330311","https://openalex.org/W1505944461","https://openalex.org/W104021676","https://openalex.org/W2106547200","https://openalex.org/W2113024102","https://openalex.org/W2057633723","https://openalex.org/W2075474943","https://openalex.org/W4200219293","https://openalex.org/W1967710610"],"abstract_inverted_index":{"Background:":[0],"Instrumental":[1],"variables":[2,285,328],"(IVs)":[3],"have":[4],"become":[5],"much":[6],"easier":[7],"to":[8,136,153,169,180,211,261,316],"find":[9],"in":[10,68,96,113,119,172,245,288,304],"the":[11,18,23,30,35,92,105,120,124,146,203,213,217,225,232,241,246,252,256,289,291,318,324],"\u201cBig":[12],"data":[13,140],"era\u201d":[14],"which":[15],"has":[16,42,46,271,279],"increased":[17,31,239,249],"number":[19,125,147,242,325],"of":[20,22,33,50,86,91,107,126,148,184,196,227,243,293,320,326],"applications":[21,98],"Two-Stage":[24],"Least":[25],"Squares":[26],"model":[27,122,192,220,248,259],"(TSLS).":[28],"With":[29],"availability":[32],"IVs,":[34],"possibility":[36],"that":[37,52,231],"these":[38],"IVs":[39,53,127,149,207,244,273],"are":[40],"weak":[41,110],"increased.":[43],"Prior":[44],"work":[45],"suggested":[47],"a":[48,55,65,132,194],"\u2018rule":[49,106,226,292,319],"thumb\u2019":[51,108,294],"with":[54,99,145],"first":[56,218,257],"stage":[57,219,258],"F":[58,214,253,312],"statistic":[59],"at":[60],"least":[61],"ten":[62],"will":[63],"avoid":[64],"relative":[66],"bias":[67],"point":[69,176],"estimates":[70],"greater":[71],"than":[72],"10%.":[73],"We":[74,130,229],"investigated":[75],"whether":[76],"or":[77],"not":[78],"this":[79,186],"threshold":[80],"was":[81,178,208,295],"also":[82],"an":[83,298],"efficient":[84,299],"guarantee":[85,300],"low":[87,115],"false":[88,116,197,233,264],"rejection":[89,117,173,198,234,265],"rates":[90,118,235],"null":[93],"hypothesis":[94,187,305],"test":[95,103],"TSLS":[97,121,247],"many":[100],"IVs.Objective:":[101],"To":[102],"how":[104],"for":[109,142,162,190,216,255,301,311],"instruments":[111],"performs":[112],"predicting":[114],"when":[123,240,269,277,323],"is":[128,314,329],"large.Method:":[129],"used":[131],"Monte":[133],"Carlo":[134],"approach":[135],"create":[137],"28":[138],"original":[139],"sets":[141],"different":[143],"models":[144],"varying":[150],"from":[151],"3":[152],"30.":[154],"For":[155],"each":[156,163,191],"model,":[157,290],"we":[158],"generated":[159],"2000":[160],"observations":[161],"iteration":[164],"and":[165,182,206,274],"conducted":[166],"50,000":[167],"iterations":[168],"reach":[170],"convergence":[171],"rates.":[174],"The":[175,200,263],"estimate":[177],"set":[179],"0,":[181],"probabilities":[183],"rejecting":[185],"were":[188,286],"recorded":[189],"as":[193],"measurement":[195],"rate.":[199],"relationship":[201],"between":[202],"endogenous":[204],"variable":[205],"carefully":[209],"adjusted":[210],"let":[212],"statistics":[215,254,313],"equal":[221,260],"ten,":[222],"thus":[223],"simulating":[224],"thumb.\u2019Results:":[228],"found":[230],"(type":[236],"I":[237],"errors)":[238],"while":[250],"holding":[251],"10.":[262],"rate":[266],"exceeds":[267],"10%":[268],"TLSL":[270,278],"24":[272],"exceed":[275],"15%":[276],"30":[280],"IVs.Conclusion:":[281],"When":[282],"more":[283,308],"instrumental":[284,327],"applied":[287],"no":[296],"longer":[297],"good":[302],"performance":[303],"testing.":[306],"A":[307],"restricted":[309],"margin":[310],"recommended":[315],"replace":[317],"thumb,\u2019":[321],"especially":[322],"large.":[330]},"counts_by_year":[{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
