{"id":"https://openalex.org/W1774574844","doi":"https://doi.org/10.1109/tit.2016.2621111","title":"Two-Stage Sampling, Prediction and Adaptive Regression via Correlation Screening","display_name":"Two-Stage Sampling, Prediction and Adaptive Regression via Correlation Screening","publication_year":2016,"publication_date":"2016-10-25","ids":{"openalex":"https://openalex.org/W1774574844","doi":"https://doi.org/10.1109/tit.2016.2621111","mag":"1774574844"},"language":"en","primary_location":{"id":"doi:10.1109/tit.2016.2621111","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tit.2016.2621111","pdf_url":null,"source":{"id":"https://openalex.org/S4502562","display_name":"IEEE Transactions on Information Theory","issn_l":"0018-9448","issn":["0018-9448","1557-9654"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Information Theory","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1502.06189","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Hamed Firouzi","orcid":"https://orcid.org/0000-0001-5418-2119"},"institutions":[{"id":"https://openalex.org/I40713646","display_name":"Goldman Sachs (United States)","ror":"https://ror.org/031rnv444","country_code":"US","type":"company","lineage":["https://openalex.org/I40713646"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Hamed Firouzi","raw_affiliation_strings":["Goldman Sachs Group, New York, NY, USA"],"affiliations":[{"raw_affiliation_string":"Goldman Sachs Group, New York, NY, USA","institution_ids":["https://openalex.org/I40713646"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Alfred O. Hero","orcid":null},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alfred O. Hero","raw_affiliation_strings":["University of Michigan, Ann Arbor, MI, USA"],"affiliations":[{"raw_affiliation_string":"University of Michigan, Ann Arbor, MI, USA","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"last","author":{"id":null,"display_name":"Bala Rajaratnam","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]},{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bala Rajaratnam","raw_affiliation_strings":["Stanford University, Stanford, CA","UC Davis, Davis, CA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"UC Davis, Davis, CA","institution_ids":["https://openalex.org/I84218800"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I40713646"],"apc_list":null,"apc_paid":null,"fwci":1.4773,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.83026538,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"63","issue":"1","first_page":"698","last_page":"714"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.6251000165939331,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.6251000165939331,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.03959999978542328,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.024000000208616257,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.5109999775886536},{"id":"https://openalex.org/keywords/linear-regression","display_name":"Linear regression","score":0.5008999705314636},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.5008000135421753},{"id":"https://openalex.org/keywords/regression-analysis","display_name":"Regression analysis","score":0.49459999799728394},{"id":"https://openalex.org/keywords/multivariate-statistics","display_name":"Multivariate statistics","score":0.477400004863739},{"id":"https://openalex.org/keywords/correlation","display_name":"Correlation","score":0.4756999909877777},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4722999930381775},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.4072999954223633}],"concepts":[{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.5986999869346619},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.5109999775886536},{"id":"https://openalex.org/C48921125","wikidata":"https://www.wikidata.org/wiki/Q10861030","display_name":"Linear regression","level":2,"score":0.5008999705314636},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.5008000135421753},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.49459999799728394},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.48739999532699585},{"id":"https://openalex.org/C161584116","wikidata":"https://www.wikidata.org/wiki/Q1952580","display_name":"Multivariate statistics","level":2,"score":0.477400004863739},{"id":"https://openalex.org/C117220453","wikidata":"https://www.wikidata.org/wiki/Q5172842","display_name":"Correlation","level":2,"score":0.4756999909877777},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4722999930381775},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.4072999954223633},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.39910000562667847},{"id":"https://openalex.org/C2780092901","wikidata":"https://www.wikidata.org/wiki/Q3433612","display_name":"Correlation coefficient","level":2,"score":0.3849000036716461},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.37059998512268066},{"id":"https://openalex.org/C182365436","wikidata":"https://www.wikidata.org/wiki/Q50701","display_name":"Variable (mathematics)","level":2,"score":0.36399999260902405},{"id":"https://openalex.org/C2781395549","wikidata":"https://www.wikidata.org/wiki/Q4680762","display_name":"Adaptive sampling","level":3,"score":0.35530000925064087},{"id":"https://openalex.org/C167085575","wikidata":"https://www.wikidata.org/wiki/Q6803654","display_name":"Mean squared prediction error","level":2,"score":0.31700000166893005},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.31369999051094055},{"id":"https://openalex.org/C27574286","wikidata":"https://www.wikidata.org/wiki/Q320723","display_name":"Variables","level":2,"score":0.29919999837875366},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.2973000109195709},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2890999913215637},{"id":"https://openalex.org/C129848803","wikidata":"https://www.wikidata.org/wiki/Q2564360","display_name":"Sample size determination","level":2,"score":0.27480000257492065},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2728999853134155},{"id":"https://openalex.org/C64946054","wikidata":"https://www.wikidata.org/wiki/Q4874476","display_name":"Bayesian multivariate linear regression","level":3,"score":0.26100000739097595},{"id":"https://openalex.org/C151956035","wikidata":"https://www.wikidata.org/wiki/Q1132755","display_name":"Logistic regression","level":2,"score":0.2578999996185303}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tit.2016.2621111","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tit.2016.2621111","pdf_url":null,"source":{"id":"https://openalex.org/S4502562","display_name":"IEEE Transactions on Information Theory","issn_l":"0018-9448","issn":["0018-9448","1557-9654"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Information Theory","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:1502.06189","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1502.06189","pdf_url":"https://arxiv.org/pdf/1502.06189","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1502.06189","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1502.06189","pdf_url":"https://arxiv.org/pdf/1502.06189","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W100935669","https://openalex.org/W1558717344","https://openalex.org/W1583155004","https://openalex.org/W1750360268","https://openalex.org/W1970502168","https://openalex.org/W1985260835","https://openalex.org/W1993948873","https://openalex.org/W1994698330","https://openalex.org/W1997840761","https://openalex.org/W2008287878","https://openalex.org/W2016119924","https://openalex.org/W2022611944","https://openalex.org/W2037044380","https://openalex.org/W2039943102","https://openalex.org/W2063978378","https://openalex.org/W2106929598","https://openalex.org/W2109357213","https://openalex.org/W2109363337","https://openalex.org/W2109449402","https://openalex.org/W2116581300","https://openalex.org/W2125536150","https://openalex.org/W2125680629","https://openalex.org/W2127271355","https://openalex.org/W2127300249","https://openalex.org/W2130134073","https://openalex.org/W2135046866","https://openalex.org/W2138019504","https://openalex.org/W2141087758","https://openalex.org/W2154349465","https://openalex.org/W2154560360","https://openalex.org/W2156540265","https://openalex.org/W2160632209","https://openalex.org/W2164452299","https://openalex.org/W2166949820","https://openalex.org/W2321124713","https://openalex.org/W2951870768","https://openalex.org/W2952563653","https://openalex.org/W3022380717","https://openalex.org/W4230704549","https://openalex.org/W4247571494","https://openalex.org/W4250955649","https://openalex.org/W6633628318","https://openalex.org/W6639815595","https://openalex.org/W6675969814","https://openalex.org/W6678315064","https://openalex.org/W6680265217","https://openalex.org/W6683430545","https://openalex.org/W6724119101","https://openalex.org/W6727395519","https://openalex.org/W6730848393","https://openalex.org/W7066667914"],"related_works":[],"abstract_inverted_index":{"This":[0],"paper":[1],"proposes":[2],"a":[3,52,58,63,73,142,180,187,202,227],"general":[4],"adaptive":[5,250],"procedure":[6],"for":[7,69,279,289],"budget-limited":[8],"predictor":[9,61,134,229],"design":[10],"in":[11,34,111,123],"high":[12,273,285],"dimensions":[13],"called":[14],"two-stage":[15],"Sampling,":[16],"Prediction":[17],"and":[18,39,133,269,292,301],"Adaptive":[19],"Regression":[20],"via":[21],"Correlation":[22],"Screening":[23],"(SPARCS).":[24],"The":[25,114,246],"SPARCS":[26,115,247],"can":[27],"be":[28],"applied":[29],"to":[30,50,56,125,179,265,272,298],"high-dimensional":[31],"prediction":[32],"problems":[33],"experimental":[35],"science,":[36],"medicine,":[37],"finance,":[38],"engineering,":[40],"as":[41],"illustrated":[42],"by":[43,232],"the":[44,99,103,117,137,165,174,197,212,217,220,224,234,243,259,280,299],"following.":[45],"Suppose":[46],"that":[47,98,215,253],"one":[48],"wishes":[49],"run":[51],"sequence":[53],"of":[54,62,77,101,106,171,176,189,208,211,219,242],"experiments":[55],"learn":[57],"sparse":[59],"multivariate":[60],"dependent":[64],"variable":[65],"Y":[66],"(disease":[67],"prognosis":[68],"instance)":[70],"based":[71],"on":[72,258],"p":[74,168,185],"dimensional":[75,286],"set":[76,105],"independent":[78],"variables":[79,107,177,214],"X":[80,87,108],"=":[81],"[X":[82],"<sub":[83,88,148,153,157],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[84,89,93,149,154,158,161],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">1</sub>":[85],",...,":[86],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">p</sub>":[90],"]":[91],"<sup":[92,160],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">T</sup>":[94],"(assayed":[95],"biomarkers).":[96],"Assume":[97],"cost":[100,132],"acquiring":[102],"full":[104,166],"increases":[109],"linearly":[110],"its":[112],"dimension.":[113],"breaks":[116],"data":[118],"collection":[119],"into":[120],"two":[121],"stages":[122],"order":[124],"achieve":[126],"an":[127,249],"optimal":[128,294],"tradeoff":[129],"between":[130],"sampling":[131],"performance.":[135],"In":[136,196],"first":[138,221,300],"stage,":[139,199,226],"we":[140,200],"collect":[141,201],"few":[143],"(n)":[144],"expensive":[145],"samples":[146,210,241],"{y":[147],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">i</sub>":[150,155],",":[151,163],"s":[152],"}":[156],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">i=1</sub>":[159],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">n</sup>":[162],"at":[164],"dimension":[167,182],"\u226b":[169],"n":[170],"X,":[172],"winnowing":[173],"number":[175,204],"down":[178],"smaller":[181],"l":[183,213],"<;":[184],"using":[186,238],"type":[188],"cross":[190],"correlation":[191],"or":[192],"regression":[193,236],"coefficient":[194],"screening.":[195],"second":[198,225,302],"larger":[203],"(t":[205],"-":[206],"n)":[207],"cheaper":[209],"passed":[216],"screening":[218],"stage.":[222],"At":[223],"low-dimensional":[228],"is":[230,248,262,270],"constructed":[231],"solving":[233],"standard":[235],"problem":[237],"all":[239],"t":[240],"selected":[244,260],"variables.":[245],"online":[251],"algorithm":[252],"implements":[254],"false":[255],"positive":[256],"control":[257],"variables,":[261],"well":[263],"suited":[264],"small":[266],"sample":[267,295],"sizes,":[268],"scalable":[271],"dimensions.":[274],"We":[275],"establish":[276,293],"asymptotic":[277],"bounds":[278],"familywise":[281],"error":[282],"rate,":[283],"specify":[284],"convergence":[287],"rates":[288],"support":[290],"recovery,":[291],"allocation":[296],"rules":[297],"stages.":[303]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2016,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2016-06-24T00:00:00"}
