{"id":"https://openalex.org/W7162432819","doi":"https://doi.org/10.48550/arxiv.2605.25460","title":"Mean-Shift PCA by Knockoff Mean","display_name":"Mean-Shift PCA by Knockoff Mean","publication_year":2026,"publication_date":"2026-05-25","ids":{"openalex":"https://openalex.org/W7162432819","doi":"https://doi.org/10.48550/arxiv.2605.25460"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.25460","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.25460","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.25460","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074974294","display_name":"Mengda Li","orcid":"https://orcid.org/0000-0002-3107-9482"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Mengda","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137030881","display_name":"Zeng Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Zeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137052730","display_name":"Jianfeng Yao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yao, Jianfeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.1307000070810318,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.1307000070810318,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10581","display_name":"Neural dynamics and brain function","score":0.12380000203847885,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11716","display_name":"Random Matrices and Applications","score":0.06390000134706497,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/principal-component-analysis","display_name":"Principal component analysis","score":0.82669997215271},{"id":"https://openalex.org/keywords/eigenvalues-and-eigenvectors","display_name":"Eigenvalues and eigenvectors","score":0.5770999789237976},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5663999915122986},{"id":"https://openalex.org/keywords/separable-space","display_name":"Separable space","score":0.499099999666214},{"id":"https://openalex.org/keywords/standard-deviation","display_name":"Standard deviation","score":0.44209998846054077},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.44130000472068787},{"id":"https://openalex.org/keywords/sparse-pca","display_name":"Sparse PCA","score":0.41749998927116394},{"id":"https://openalex.org/keywords/invariant","display_name":"Invariant (physics)","score":0.39739999175071716}],"concepts":[{"id":"https://openalex.org/C27438332","wikidata":"https://www.wikidata.org/wiki/Q2873","display_name":"Principal component analysis","level":2,"score":0.82669997215271},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.5856000185012817},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.5770999789237976},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5663999915122986},{"id":"https://openalex.org/C70710897","wikidata":"https://www.wikidata.org/wiki/Q680081","display_name":"Separable space","level":2,"score":0.499099999666214},{"id":"https://openalex.org/C22679943","wikidata":"https://www.wikidata.org/wiki/Q159375","display_name":"Standard deviation","level":2,"score":0.44209998846054077},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.44130000472068787},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42329999804496765},{"id":"https://openalex.org/C24252448","wikidata":"https://www.wikidata.org/wiki/Q7573786","display_name":"Sparse PCA","level":3,"score":0.41749998927116394},{"id":"https://openalex.org/C190470478","wikidata":"https://www.wikidata.org/wiki/Q2370229","display_name":"Invariant (physics)","level":2,"score":0.39739999175071716},{"id":"https://openalex.org/C149629883","wikidata":"https://www.wikidata.org/wiki/Q660926","display_name":"Fraction (chemistry)","level":2,"score":0.361299991607666},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.3407000005245209},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.33390000462532043},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.29739999771118164},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.27570000290870667},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.27379998564720154},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.2680000066757202},{"id":"https://openalex.org/C2777749129","wikidata":"https://www.wikidata.org/wiki/Q17148469","display_name":"Robust principal component analysis","level":3,"score":0.26759999990463257},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.2587999999523163},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.2549000084400177},{"id":"https://openalex.org/C64812099","wikidata":"https://www.wikidata.org/wiki/Q176604","display_name":"Random matrix","level":3,"score":0.2506999969482422}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.25460","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.25460","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.25460","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.25460","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Removing":[0],"noise":[1,6],"is":[2,7,30],"difficult,":[3],"but":[4],"adding":[5,125],"easy.":[8],"In":[9,57],"this":[10,114],"work,":[11],"we":[12,81,117],"show":[13],"how":[14],"to":[15,33,105],"eliminate":[16],"mean-shift":[17,26,67,85,133],"noisy":[18],"components":[19],"from":[20,44,77,90],"PCA":[21,29,62,122,138],"by":[22,124],"deliberately":[23],"introducing":[24],"knockoff":[25,126],"perturbation.":[27],"Standard":[28],"highly":[31],"sensitive":[32],"shifts":[34],"in":[35,52,71],"the":[36,53,66,72,84,91,95,99,106,110,132],"sample":[37],"mean:":[38],"a":[39,45,119],"small":[40],"fraction":[41],"of":[42,94,109],"samples":[43],"shifted":[46],"distribution":[47],"can":[48],"cause":[49],"large":[50],"deviations":[51],"leading":[54],"principal":[55],"components.":[56],"high-dimensional":[58],"regimes,":[59],"existing":[60],"Robust":[61],"approaches":[63],"cannot":[64],"handle":[65],"contamination":[68],"structure":[69],"inherent":[70],"mixture":[73,111],"model.":[74],"Using":[75],"tools":[76],"Random":[78],"Matrix":[79],"Theory,":[80],"prove":[82],"that":[83,128],"spikes":[86],"are":[87],"spectrally":[88],"separable":[89],"stable":[92],"eigenvalues":[93],"original":[96,100],"covariance.":[97],"Furthermore,":[98],"eigenspace":[101],"remains":[102],"asymptotically":[103],"invariant":[104],"contamination,":[107],"independent":[108],"weight.":[112],"Exploiting":[113],"spectral":[115],"stability,":[116],"propose":[118],"simple,":[120],"two-stage":[121],"algorithm":[123],"mean":[127],"identifies":[129],"and":[130],"removes":[131],"component":[134],"using":[135],"only":[136],"standard":[137],"operations.":[139]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-27T00:00:00"}
