{"id":"https://openalex.org/W3199899101","doi":"https://doi.org/10.1080/10618600.2022.2130928","title":"Asynchronous and Distributed Data Augmentation for Massive Data Settings","display_name":"Asynchronous and Distributed Data Augmentation for Massive Data Settings","publication_year":2022,"publication_date":"2022-10-03","ids":{"openalex":"https://openalex.org/W3199899101","doi":"https://doi.org/10.1080/10618600.2022.2130928","mag":"3199899101"},"language":"en","primary_location":{"id":"doi:10.1080/10618600.2022.2130928","is_oa":false,"landing_page_url":"https://doi.org/10.1080/10618600.2022.2130928","pdf_url":null,"source":{"id":"https://openalex.org/S76159266","display_name":"Journal of Computational and Graphical Statistics","issn_l":"1061-8600","issn":["1061-8600","1537-2715"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Computational and Graphical Statistics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://figshare.com/articles/dataset/Asynchronous_and_Distributed_Data_Augmentation_for_Massive_Data_Settings/21263191","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100981161","display_name":"Jiayuan Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiayuan Zhou","raw_affiliation_strings":["Department of Statistics, University of Florida","Department of Statistics, University of Florida, Gainesville, FL"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Statistics, University of Florida","institution_ids":["https://openalex.org/I33213144"]},{"raw_affiliation_string":"Department of Statistics, University of Florida, Gainesville, FL","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070014481","display_name":"Kshitij Khare","orcid":"https://orcid.org/0000-0001-8595-7503"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kshitij Khare","raw_affiliation_strings":["Department of Statistics, University of Florida","Department of Statistics, University of Florida, Gainesville, FL"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Statistics, University of Florida","institution_ids":["https://openalex.org/I33213144"]},{"raw_affiliation_string":"Department of Statistics, University of Florida, Gainesville, FL","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049124418","display_name":"Sanvesh Srivastava","orcid":"https://orcid.org/0000-0002-5483-9579"},"institutions":[{"id":"https://openalex.org/I126307644","display_name":"University of Iowa","ror":"https://ror.org/036jqmy94","country_code":"US","type":"education","lineage":["https://openalex.org/I126307644"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sanvesh Srivastava","raw_affiliation_strings":["Department of Statistics and Actuarial Science, The University of Iowa","Department of Statistics and Actuarial Science, The University of Iowa, Iowa City, IA"],"raw_orcid":"https://orcid.org/0000-0002-5483-9579","affiliations":[{"raw_affiliation_string":"Department of Statistics and Actuarial Science, The University of Iowa","institution_ids":["https://openalex.org/I126307644"]},{"raw_affiliation_string":"Department of Statistics and Actuarial Science, The University of Iowa, Iowa City, IA","institution_ids":["https://openalex.org/I126307644"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5049124418"],"corresponding_institution_ids":["https://openalex.org/I126307644"],"apc_list":null,"apc_paid":null,"fwci":0.2466,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.53351516,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"32","issue":"3","first_page":"895","last_page":"907"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12056","display_name":"Markov Chains and Monte Carlo Methods","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12056","display_name":"Markov Chains and Monte Carlo Methods","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9786999821662903,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/asynchronous-communication","display_name":"Asynchronous communication","score":0.72356778383255},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.7184032201766968},{"id":"https://openalex.org/keywords/fraction","display_name":"Fraction (chemistry)","score":0.6857969760894775},{"id":"https://openalex.org/keywords/ergodicity","display_name":"Ergodicity","score":0.6809564828872681},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5593553781509399},{"id":"https://openalex.org/keywords/disjoint-sets","display_name":"Disjoint sets","score":0.5372827649116516},{"id":"https://openalex.org/keywords/ergodic-theory","display_name":"Ergodic theory","score":0.5192932486534119},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3994753062725067},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3697296977043152},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.32325658202171326},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.25267964601516724},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.16595014929771423},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.10307002067565918},{"id":"https://openalex.org/keywords/pure-mathematics","display_name":"Pure mathematics","score":0.0799945592880249}],"concepts":[{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.72356778383255},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.7184032201766968},{"id":"https://openalex.org/C149629883","wikidata":"https://www.wikidata.org/wiki/Q660926","display_name":"Fraction (chemistry)","level":2,"score":0.6857969760894775},{"id":"https://openalex.org/C201779956","wikidata":"https://www.wikidata.org/wiki/Q5426803","display_name":"Ergodicity","level":2,"score":0.6809564828872681},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5593553781509399},{"id":"https://openalex.org/C45340560","wikidata":"https://www.wikidata.org/wiki/Q215382","display_name":"Disjoint sets","level":2,"score":0.5372827649116516},{"id":"https://openalex.org/C122044880","wikidata":"https://www.wikidata.org/wiki/Q5498822","display_name":"Ergodic theory","level":2,"score":0.5192932486534119},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3994753062725067},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3697296977043152},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.32325658202171326},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.25267964601516724},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.16595014929771423},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.10307002067565918},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0799945592880249},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1080/10618600.2022.2130928","is_oa":false,"landing_page_url":"https://doi.org/10.1080/10618600.2022.2130928","pdf_url":null,"source":{"id":"https://openalex.org/S76159266","display_name":"Journal of Computational and Graphical Statistics","issn_l":"1061-8600","issn":["1061-8600","1537-2715"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Computational and Graphical Statistics","raw_type":"journal-article"},{"id":"pmh:oai:figshare.com:article/21263191","is_oa":true,"landing_page_url":"https://figshare.com/articles/dataset/Asynchronous_and_Distributed_Data_Augmentation_for_Massive_Data_Settings/21263191","pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Dataset"},{"id":"doi:10.6084/m9.figshare.21263191.v1","is_oa":true,"landing_page_url":"https://doi.org/10.6084/m9.figshare.21263191.v1","pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"pmh:oai:figshare.com:article/21263191","is_oa":true,"landing_page_url":"https://figshare.com/articles/dataset/Asynchronous_and_Distributed_Data_Augmentation_for_Massive_Data_Settings/21263191","pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Dataset"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1326223872","display_name":null,"funder_award_id":"DMS-1854667/1854662","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G1940144667","display_name":null,"funder_award_id":"ONR-BAA N000141812741","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320337345","display_name":"Office of Naval Research","ror":"https://ror.org/00rk2pe57"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":72,"referenced_works":["https://openalex.org/W1499965417","https://openalex.org/W1599118604","https://openalex.org/W1686266550","https://openalex.org/W1878934793","https://openalex.org/W1897305366","https://openalex.org/W1982508956","https://openalex.org/W1985093013","https://openalex.org/W1988251813","https://openalex.org/W1988698355","https://openalex.org/W1989692914","https://openalex.org/W1990650244","https://openalex.org/W1994726788","https://openalex.org/W2001074797","https://openalex.org/W2025183033","https://openalex.org/W2049633694","https://openalex.org/W2062313495","https://openalex.org/W2064387721","https://openalex.org/W2073680033","https://openalex.org/W2075453090","https://openalex.org/W2078055172","https://openalex.org/W2099878672","https://openalex.org/W2103133389","https://openalex.org/W2104863866","https://openalex.org/W2107750953","https://openalex.org/W2113547287","https://openalex.org/W2115067168","https://openalex.org/W2116137244","https://openalex.org/W2128598176","https://openalex.org/W2128709328","https://openalex.org/W2142534468","https://openalex.org/W2161340280","https://openalex.org/W2167433878","https://openalex.org/W2305001871","https://openalex.org/W2404352102","https://openalex.org/W2478818565","https://openalex.org/W2586452038","https://openalex.org/W2603869849","https://openalex.org/W2769195552","https://openalex.org/W2810822878","https://openalex.org/W2890027086","https://openalex.org/W2941876699","https://openalex.org/W2951601728","https://openalex.org/W2953042718","https://openalex.org/W2962777160","https://openalex.org/W2962934207","https://openalex.org/W2963131997","https://openalex.org/W2963254535","https://openalex.org/W2963347209","https://openalex.org/W2963483298","https://openalex.org/W2963561977","https://openalex.org/W2963656210","https://openalex.org/W2963888630","https://openalex.org/W2964231067","https://openalex.org/W2964276553","https://openalex.org/W2964293062","https://openalex.org/W2970389665","https://openalex.org/W2989681379","https://openalex.org/W2997048015","https://openalex.org/W3100688298","https://openalex.org/W3104370808","https://openalex.org/W3122960922","https://openalex.org/W3168044932","https://openalex.org/W3170733181","https://openalex.org/W3176229821","https://openalex.org/W3177266934","https://openalex.org/W3184934179","https://openalex.org/W3194095253","https://openalex.org/W4250059046","https://openalex.org/W4292403327","https://openalex.org/W4310895557","https://openalex.org/W6677121468","https://openalex.org/W6704886596"],"related_works":["https://openalex.org/W1972942382","https://openalex.org/W2009962825","https://openalex.org/W1722744795","https://openalex.org/W124275629","https://openalex.org/W2136727990","https://openalex.org/W4287662864","https://openalex.org/W2950014027","https://openalex.org/W2952991236","https://openalex.org/W964575223","https://openalex.org/W4296948412"],"abstract_inverted_index":{"Data":[0],"augmentation":[1],"(DA)":[2],"algorithms":[3],"are":[4,106,194],"slow":[5],"in":[6,157],"massive":[7],"data":[8,65,87,101],"settings":[9],"due":[10],"to":[11],"multiple":[12],"passes":[13],"through":[14],"the":[15,45,63,85,95,99,109,122,130,138,164,168,174],"entire":[16,64],"data.":[17,118],"We":[18,119,142,161],"address":[19],"this":[20,192],"problem":[21],"by":[22,55,61],"developing":[23],"a":[24,56],"DA":[25,35,43,47,140],"extension":[26],"that":[27,121,144],"exploits":[28],"asynchronous":[29],"and":[30,40,59,70,93,113],"distributed":[31],"computing.":[32],"The":[33,103],"extended":[34],"algorithm":[36],"is":[37,53,126,146],"called":[38],"Asynchronous":[39],"Distributed":[41],"(AD)":[42],"with":[44,89,129],"original":[46],"as":[48],"its":[49,150],"parent.":[50],"Any":[51],"ADDA":[52,79,123,145,169],"indexed":[54],"parameter":[57,104],"r\u2208(0,1)":[58],"starts":[60],"dividing":[62],"into":[66],"k":[67,74,86],"disjoint":[68],"subsets":[69,88],"storing":[71],"them":[72],"on":[73,137],"processes.":[75],"Every":[76],"iteration":[77],"of":[78,84,98,111,115,167,185],"augments":[80],"only":[81],"an":[82],"r-fraction":[83,110],"some":[90],"positive":[91],"probability":[92],"leaves":[94],"remaining":[96],"(1\u2212r)-fraction":[97,114],"augmented":[100,117],"unchanged.":[102],"draws":[105],"obtained":[107],"using":[108],"new":[112],"old":[116],"show":[120],"Markov":[124,170],"chain":[125,171],"Harris":[127],"ergodic":[128],"desired":[131,186],"stationary":[132],"distribution":[133],"under":[134],"mild":[135],"conditions":[136],"parent":[139,151],"algorithm.":[141],"demonstrate":[143],"significantly":[147],"faster":[148],"than":[149],"for":[152,172,183,191],"many":[153],"(k,":[154],"r)":[155],"choices":[156],"three":[158,175],"representative":[159],"models.":[160],"also":[162],"establish":[163],"geometric":[165],"ergodicity":[166],"all":[173],"models,":[176],"which":[177],"yields":[178],"asymptotically":[179],"valid":[180],"standard":[181],"errors":[182],"estimates":[184],"posterior":[187],"quantities.":[188],"Supplementary":[189],"materials":[190],"article":[193],"available":[195],"online.":[196]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
