{"id":"https://openalex.org/W7131432886","doi":"https://doi.org/10.48550/arxiv.2602.20698","title":"High-Dimensional Robust Mean Estimation with Untrusted Batches","display_name":"High-Dimensional Robust Mean Estimation with Untrusted Batches","publication_year":2026,"publication_date":"2026-02-24","ids":{"openalex":"https://openalex.org/W7131432886","doi":"https://doi.org/10.48550/arxiv.2602.20698"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.20698","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.20698","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.20698","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126782762","display_name":"Maryam Aliakbarpour","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Aliakbarpour, Maryam","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126809081","display_name":"Vladimir Braverman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Braverman, Vladimir","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126825772","display_name":"Yuhan Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yuhan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126817507","display_name":"Junze Yin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yin, Junze","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5126782762"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.3224000036716461,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.3224000036716461,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.25099998712539673,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.11069999635219574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/fraction","display_name":"Fraction (chemistry)","score":0.5936999917030334},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.4860999882221222},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.48570001125335693},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.45989999175071716},{"id":"https://openalex.org/keywords/distribution","display_name":"Distribution (mathematics)","score":0.423799991607666},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.4088999927043915},{"id":"https://openalex.org/keywords/statistical-inference","display_name":"Statistical inference","score":0.3292999863624573},{"id":"https://openalex.org/keywords/language-change","display_name":"Language change","score":0.3176000118255615},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.31459999084472656}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5952000021934509},{"id":"https://openalex.org/C149629883","wikidata":"https://www.wikidata.org/wiki/Q660926","display_name":"Fraction (chemistry)","level":2,"score":0.5936999917030334},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.4860999882221222},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.48570001125335693},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.45989999175071716},{"id":"https://openalex.org/C110121322","wikidata":"https://www.wikidata.org/wiki/Q865811","display_name":"Distribution (mathematics)","level":2,"score":0.423799991607666},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.4088999927043915},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3935000002384186},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.367900013923645},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.34769999980926514},{"id":"https://openalex.org/C134261354","wikidata":"https://www.wikidata.org/wiki/Q938438","display_name":"Statistical inference","level":2,"score":0.3292999863624573},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.32580000162124634},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3249000012874603},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.3237000107765198},{"id":"https://openalex.org/C2780027415","wikidata":"https://www.wikidata.org/wiki/Q524648","display_name":"Language change","level":2,"score":0.3176000118255615},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.31459999084472656},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.3133000135421753},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.31049999594688416},{"id":"https://openalex.org/C167928553","wikidata":"https://www.wikidata.org/wiki/Q1376021","display_name":"Estimation theory","level":2,"score":0.3021000027656555},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.30000001192092896},{"id":"https://openalex.org/C62100291","wikidata":"https://www.wikidata.org/wiki/Q1936288","display_name":"Total variation","level":2,"score":0.2879999876022339},{"id":"https://openalex.org/C58948655","wikidata":"https://www.wikidata.org/wiki/Q7604392","display_name":"Statistical distance","level":3,"score":0.274399995803833},{"id":"https://openalex.org/C2781039887","wikidata":"https://www.wikidata.org/wiki/Q1391724","display_name":"Factor (programming language)","level":2,"score":0.2727999985218048},{"id":"https://openalex.org/C98385598","wikidata":"https://www.wikidata.org/wiki/Q1339385","display_name":"Empirical distribution function","level":2,"score":0.26899999380111694},{"id":"https://openalex.org/C87007009","wikidata":"https://www.wikidata.org/wiki/Q210832","display_name":"Statistical hypothesis testing","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C67226441","wikidata":"https://www.wikidata.org/wiki/Q1665389","display_name":"Robust statistics","level":3,"score":0.26260000467300415},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.26010000705718994},{"id":"https://openalex.org/C75438885","wikidata":"https://www.wikidata.org/wiki/Q3403615","display_name":"Large deviations theory","level":2,"score":0.2578999996185303},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.25440001487731934}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.20698","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.20698","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.20698","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.20698","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.807201623916626}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,50,173],"study":[1],"high-dimensional":[2,111],"mean":[3,30],"estimation":[4],"in":[5,16,104,153],"a":[6,24,33,38,55,83,127,160,215],"collaborative":[7],"setting":[8],"where":[9],"data":[10,72],"is":[11,212],"contributed":[12],"by":[13,82,214,225],"$N$":[14],"users":[15,62,70,211],"batches":[17,121],"of":[18,32,40,61,129,135,163,209,217],"size":[19],"$n$.":[20],"In":[21,144],"this":[22,52,98,182],"environment,":[23],"learner":[25],"seeks":[26],"to":[27,78,180,220],"recover":[28],"the":[29,67,91,109,146,188,207,221,226],"$\u03bc$":[31],"true":[34],"distribution":[35],"$P$":[36],"from":[37,73,124],"collection":[39],"sources":[41],"that":[42,75,198],"are":[43,63,76,122,141],"both":[44],"statistically":[45],"heterogeneous":[46],"and":[47,170],"potentially":[48],"malicious.":[49],"formalize":[51],"challenge":[53],"through":[54],"double":[56],"corruption":[57,165],"landscape:":[58],"an":[59,133,203],"$\\varepsilon$-fraction":[60],"entirely":[64],"adversarial,":[65],"while":[66,199],"remaining":[68],"``good''":[69],"provide":[71,174],"distributions":[74,125],"related":[77],"$P$,":[79],"but":[80],"deviate":[81],"proximity":[84],"parameter":[85],"$\u03b1$.":[86],"Unlike":[87],"existing":[88],"work":[89],"on":[90],"untrusted":[92],"batch":[93,140,227],"model,":[94],"which":[95],"typically":[96],"measures":[97],"deviation":[99],"via":[100],"total":[101],"variation":[102],"distance":[103],"discrete":[105,157],"settings,":[106,158],"we":[107],"address":[108],"continuous,":[110],"regime":[112],"under":[113],"two":[114,175],"natural":[115],"variants":[116],"for":[117],"deviation:":[118],"(1)":[119],"good":[120,139],"drawn":[123],"with":[126],"mean-shift":[128],"$\\sqrt\u03b1$,":[130],"or":[131],"(2)":[132],"$\u03b1$-fraction":[134],"samples":[136],"within":[137],"each":[138],"adversarially":[142],"corrupted.":[143],"particular,":[145],"second":[147],"model":[148],"presents":[149],"significant":[150],"new":[151],"challenges:":[152],"high":[154],"dimensions,":[155],"unlike":[156],"even":[159],"small":[161],"fraction":[162],"sample-level":[164],"can":[166],"shift":[167],"empirical":[168],"means":[169],"covariances":[171],"arbitrarily.":[172],"Sum-of-Squares":[176],"(SoS)":[177],"based":[178],"algorithms":[179,186],"navigate":[181],"tiered":[183],"corruption.":[184],"Our":[185],"achieve":[187],"minimax-optimal":[189],"error":[190],"rate":[191],"$O(\\sqrt{\\varepsilon/n}":[192],"+":[193,195],"\\sqrt{d/nN}":[194],"\\sqrt\u03b1)$,":[196],"demonstrating":[197],"heterogeneity":[200],"$\u03b1$":[201],"represents":[202],"inherent":[204],"statistical":[205],"difficulty,":[206],"influence":[208],"adversarial":[210],"suppressed":[213],"factor":[216],"$1/\\sqrt{n}$":[218],"due":[219],"internal":[222],"averaging":[223],"afforded":[224],"structure.":[228]},"counts_by_year":[],"updated_date":"2026-02-26T06:34:08.959763","created_date":"2026-02-26T00:00:00"}
