{"id":"https://openalex.org/W7127361062","doi":"https://doi.org/10.48550/arxiv.2602.02190","title":"PCA of probability measures: Sparse and Dense sampling regimes","display_name":"PCA of probability measures: Sparse and Dense sampling regimes","publication_year":2026,"publication_date":"2026-02-02","ids":{"openalex":"https://openalex.org/W7127361062","doi":"https://doi.org/10.48550/arxiv.2602.02190"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.02190","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124942084","display_name":"Gachon Erell","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Erell, Gachon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122995162","display_name":"J\u00e9r\u00e9mie Bigot","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bigot, J\u00e9r\u00e9mie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5028493116","display_name":"Elsa Cazelles","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cazelles, Elsa","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.5080999732017517,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.5080999732017517,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.12409999966621399,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.06780000030994415,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/covariance-operator","display_name":"Covariance operator","score":0.6381000280380249},{"id":"https://openalex.org/keywords/minimax","display_name":"Minimax","score":0.6301000118255615},{"id":"https://openalex.org/keywords/covariance","display_name":"Covariance","score":0.6043000221252441},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.5547000169754028},{"id":"https://openalex.org/keywords/rate-of-convergence","display_name":"Rate of convergence","score":0.5286999940872192},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.5060999989509583},{"id":"https://openalex.org/keywords/probability-measure","display_name":"Probability measure","score":0.4991999864578247},{"id":"https://openalex.org/keywords/hilbert-space","display_name":"Hilbert space","score":0.45249998569488525}],"concepts":[{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.7533000111579895},{"id":"https://openalex.org/C103692563","wikidata":"https://www.wikidata.org/wiki/Q5178900","display_name":"Covariance operator","level":3,"score":0.6381000280380249},{"id":"https://openalex.org/C149728462","wikidata":"https://www.wikidata.org/wiki/Q751319","display_name":"Minimax","level":2,"score":0.6301000118255615},{"id":"https://openalex.org/C178650346","wikidata":"https://www.wikidata.org/wiki/Q201984","display_name":"Covariance","level":2,"score":0.6043000221252441},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.5547000169754028},{"id":"https://openalex.org/C57869625","wikidata":"https://www.wikidata.org/wiki/Q1783502","display_name":"Rate of convergence","level":3,"score":0.5286999940872192},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5060999989509583},{"id":"https://openalex.org/C21031990","wikidata":"https://www.wikidata.org/wiki/Q355020","display_name":"Probability measure","level":2,"score":0.4991999864578247},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.4740999937057495},{"id":"https://openalex.org/C62799726","wikidata":"https://www.wikidata.org/wiki/Q190056","display_name":"Hilbert space","level":2,"score":0.45249998569488525},{"id":"https://openalex.org/C27438332","wikidata":"https://www.wikidata.org/wiki/Q2873","display_name":"Principal component analysis","level":2,"score":0.4296000003814697},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.42149999737739563},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.41760000586509705},{"id":"https://openalex.org/C206654554","wikidata":"https://www.wikidata.org/wiki/Q5374247","display_name":"Empirical measure","level":2,"score":0.41280001401901245},{"id":"https://openalex.org/C185142706","wikidata":"https://www.wikidata.org/wiki/Q1134404","display_name":"Covariance matrix","level":2,"score":0.38909998536109924},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.36329999566078186},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.3614000082015991},{"id":"https://openalex.org/C17020691","wikidata":"https://www.wikidata.org/wiki/Q139677","display_name":"Operator (biology)","level":5,"score":0.35600000619888306},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.35260000824928284},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.337799996137619},{"id":"https://openalex.org/C52740198","wikidata":"https://www.wikidata.org/wiki/Q1539564","display_name":"Importance sampling","level":3,"score":0.2955000102519989},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.27230000495910645},{"id":"https://openalex.org/C24252448","wikidata":"https://www.wikidata.org/wiki/Q7573786","display_name":"Sparse PCA","level":3,"score":0.2549999952316284}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.02190","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.02190","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.02190","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.02190","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"A":[0],"common":[1],"approach":[2],"to":[3,10,121],"perform":[4],"PCA":[5,20,55,88,158],"on":[6,94],"probability":[7,63],"measures":[8,64,107],"is":[9,137],"embed":[11],"them":[12],"into":[13],"a":[14,31,57,117],"Hilbert":[15],"space":[16],"where":[17,61,91],"standard":[18],"functional":[19],"techniques":[21],"apply.":[22],"While":[23],"convergence":[24,73,128],"rates":[25,74,151],"for":[26,81,140],"estimating":[27],"the":[28,40,45,76,82,87,95,100,103,109,127,134,141],"embedding":[29],"of":[30,75,106,112],"single":[32],"measure":[33],"from":[34],"$m$":[35,69,111],"samples":[36,113],"are":[37,65],"well":[38],"understood,":[39],"literature":[41],"has":[42],"not":[43],"addressed":[44],"setting":[46],"involving":[47],"multiple":[48],"measures.":[49],"In":[50],"this":[51],"paper,":[52],"we":[53,131],"study":[54],"in":[56,126],"double":[58],"asymptotic":[59],"regime":[60],"$n$":[62,105],"observed,":[66],"each":[67],"through":[68],"samples.":[70],"We":[71],"derive":[72],"form":[77],"$n^{-1/2}":[78],"+":[79],"m^{-\u03b1}$":[80],"empirical":[83,142],"covariance":[84,143],"operator":[85],"and":[86,108,152],"excess":[89],"risk,":[90],"$\u03b1&gt;0$":[92],"depends":[93],"chosen":[96],"embedding.":[97],"This":[98],"characterizes":[99],"relationship":[101],"between":[102],"number":[104,110],"per":[114],"measure,":[115],"revealing":[116],"sparse":[118],"(small":[119],"$m$)":[120,124],"dense":[122],"(large":[123],"transition":[125],"behavior.":[129],"Moreover,":[130],"prove":[132],"that":[133,154],"dense-regime":[135],"rate":[136],"minimax":[138],"optimal":[139],"error.":[144],"Our":[145],"numerical":[146],"experiments":[147],"validate":[148],"these":[149],"theoretical":[150],"demonstrate":[153],"appropriate":[155],"subsampling":[156],"preserves":[157],"accuracy":[159],"while":[160],"reducing":[161],"computational":[162],"cost.":[163]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-04T00:00:00"}
