{"id":"https://openalex.org/W7161270950","doi":"https://doi.org/10.48550/arxiv.2605.14927","title":"Learning with Shallow Neural Networks on Cluster-Structured Features","display_name":"Learning with Shallow Neural Networks on Cluster-Structured Features","publication_year":2026,"publication_date":"2026-05-14","ids":{"openalex":"https://openalex.org/W7161270950","doi":"https://doi.org/10.48550/arxiv.2605.14927"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.14927","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14927","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.14927","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004244752","display_name":"Elisabetta Cornacchia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cornacchia, Elisabetta","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136242649","display_name":"Laurent Massouli\u00e9","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Massouli\u00e9, Laurent","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.3499000072479248,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.3499000072479248,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.1527000069618225,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.09489999711513519,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/identifiability","display_name":"Identifiability","score":0.8008999824523926},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.48429998755455017},{"id":"https://openalex.org/keywords/logarithm","display_name":"Logarithm","score":0.4830999970436096},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.45350000262260437},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4399000108242035},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.43720000982284546},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.4156999886035919},{"id":"https://openalex.org/keywords/correlation","display_name":"Correlation","score":0.38989999890327454}],"concepts":[{"id":"https://openalex.org/C122770356","wikidata":"https://www.wikidata.org/wiki/Q1656753","display_name":"Identifiability","level":2,"score":0.8008999824523926},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.555400013923645},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4893999993801117},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.48429998755455017},{"id":"https://openalex.org/C39927690","wikidata":"https://www.wikidata.org/wiki/Q11197","display_name":"Logarithm","level":2,"score":0.4830999970436096},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.45350000262260437},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4399000108242035},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.43720000982284546},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.423799991607666},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.4156999886035919},{"id":"https://openalex.org/C117220453","wikidata":"https://www.wikidata.org/wiki/Q5172842","display_name":"Correlation","level":2,"score":0.38989999890327454},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3756999969482422},{"id":"https://openalex.org/C51167844","wikidata":"https://www.wikidata.org/wiki/Q4422623","display_name":"Latent variable","level":2,"score":0.373199999332428},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.30709999799728394},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.30059999227523804},{"id":"https://openalex.org/C2779127903","wikidata":"https://www.wikidata.org/wiki/Q6510194","display_name":"Learning rule","level":3,"score":0.28690001368522644},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2818000018596649},{"id":"https://openalex.org/C65965080","wikidata":"https://www.wikidata.org/wiki/Q1806885","display_name":"Latent variable model","level":3,"score":0.27900001406669617},{"id":"https://openalex.org/C129848803","wikidata":"https://www.wikidata.org/wiki/Q2564360","display_name":"Sample size determination","level":2,"score":0.27619999647140503},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.274399995803833},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.2572000026702881},{"id":"https://openalex.org/C3020318244","wikidata":"https://www.wikidata.org/wiki/Q4812187","display_name":"Large sample","level":2,"score":0.25600001215934753},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.25429999828338623}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.14927","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14927","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.14927","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14927","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"success":[1],"of":[2,14,75,94,129,142],"deep":[3],"learning":[4,76],"in":[5,17,30],"high-dimensional":[6],"settings":[7],"is":[8,137,140],"often":[9],"attributed":[10],"to":[11,66,147],"the":[12,31,54,72,107,122,127,134,143],"presence":[13],"low-dimensional":[15,39],"structure":[16,28],"real-world":[18],"data.":[19,161],"While":[20],"standard":[21],"theoretical":[22,154],"models":[23],"typically":[24],"assume":[25],"that":[26,88,116],"this":[27,59],"lies":[29],"target":[32],"function,":[33],"projecting":[34],"unstructured":[35],"inputs":[36],"onto":[37],"a":[38,63,91,118],"subspace,":[40],"data":[41],"such":[42],"as":[43],"images,":[44],"text":[45],"or":[46],"genomic":[47],"sequences":[48],"exhibit":[49],"strong":[50],"spatial":[51],"correlations":[52,70],"within":[53],"input":[55,99,144],"space":[56],"itself.":[57],"In":[58],"paper,":[60],"we":[61,85,114],"propose":[62],"tractable":[64],"model":[65],"study":[67],"how":[68],"these":[69],"affect":[71],"sample":[73,123],"complexity":[74,124],"with":[77,106,126],"gradient":[78],"descent":[79],"on":[80,90,156],"shallow":[81],"neural":[82],"networks.":[83],"Specifically,":[84],"consider":[86],"targets":[87],"depend":[89],"small":[92],"number":[93,128],"latent":[95,108],"Boolean":[96],"variables,":[97],"and":[98,104,159],"features":[100],"grouped":[101],"into":[102],"clusters":[103],"correlated":[105],"variables.":[109],"Under":[110],"an":[111],"identifiability":[112],"assumption,":[113],"show":[115],"for":[117],"layerwise":[119],"gradient-descent":[120],"variant,":[121],"scales":[125],"hidden":[130],"variables":[131],"and,":[132],"when":[133],"signal-to-noise":[135],"ratio":[136],"sufficiently":[138],"high,":[139],"independent":[141],"dimension,":[145],"up":[146],"logarithmic":[148],"terms.":[149],"We":[150],"empirically":[151],"test":[152],"our":[153],"findings":[155],"both":[157],"synthetic":[158],"real":[160]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-05-16T00:00:00"}
