{"id":"https://openalex.org/W7143300850","doi":"https://doi.org/10.48550/arxiv.2603.25839","title":"A Compression Perspective on Simplicity Bias","display_name":"A Compression Perspective on Simplicity Bias","publication_year":2026,"publication_date":"2026-03-26","ids":{"openalex":"https://openalex.org/W7143300850","doi":"https://doi.org/10.48550/arxiv.2603.25839"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.25839","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.25839","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.25839","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130988607","display_name":"Tom Marty","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Marty, Tom","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130990235","display_name":"Eric Elmoznino","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Elmoznino, Eric","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051274578","display_name":"L\u00e9o Gagnon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gagnon, Leo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130917456","display_name":"Tejas Kasetty","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kasetty, Tejas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057585119","display_name":"Mizu Nishikawa-Toomey","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nishikawa-Toomey, Mizu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020059055","display_name":"Sarthak Mittal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mittal, Sarthak","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130926450","display_name":"Guillaume Lajoie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lajoie, Guillaume","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5109398524","display_name":"Dhanya Sridhar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sridhar, Dhanya","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5130988607"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.36730000376701355,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.36730000376701355,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.14650000631809235,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.14499999582767487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/simplicity","display_name":"Simplicity","score":0.6880000233650208},{"id":"https://openalex.org/keywords/spurious-relationship","display_name":"Spurious relationship","score":0.6646999716758728},{"id":"https://openalex.org/keywords/lossless-compression","display_name":"Lossless compression","score":0.6438999772071838},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5928999781608582},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5612000226974487},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.44339999556541443},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.4120999872684479},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.38690000772476196},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.3792000114917755},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.36890000104904175}],"concepts":[{"id":"https://openalex.org/C2776372474","wikidata":"https://www.wikidata.org/wiki/Q508291","display_name":"Simplicity","level":2,"score":0.6880000233650208},{"id":"https://openalex.org/C97256817","wikidata":"https://www.wikidata.org/wiki/Q1462316","display_name":"Spurious relationship","level":2,"score":0.6646999716758728},{"id":"https://openalex.org/C81081738","wikidata":"https://www.wikidata.org/wiki/Q55542","display_name":"Lossless compression","level":3,"score":0.6438999772071838},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6241999864578247},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5928999781608582},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5612000226974487},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5092999935150146},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.44339999556541443},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.42660000920295715},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.4120999872684479},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4018000066280365},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.38690000772476196},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.3792000114917755},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.36890000104904175},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.3646000027656555},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.3628000020980835},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.35659998655319214},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.3490999937057495},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.3458999991416931},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.32109999656677246},{"id":"https://openalex.org/C21080849","wikidata":"https://www.wikidata.org/wiki/Q13611879","display_name":"Data point","level":2,"score":0.31060001254081726},{"id":"https://openalex.org/C16811321","wikidata":"https://www.wikidata.org/wiki/Q17138905","display_name":"Minimum redundancy feature selection","level":3,"score":0.30880001187324524},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.30880001187324524},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.2994999885559082},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.2768999934196472},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.27469998598098755},{"id":"https://openalex.org/C175291020","wikidata":"https://www.wikidata.org/wiki/Q1156822","display_name":"Offset (computer science)","level":2,"score":0.2734000086784363},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.2728999853134155},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.2711000144481659},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2630000114440918},{"id":"https://openalex.org/C87465248","wikidata":"https://www.wikidata.org/wiki/Q1417790","display_name":"Minimum description length","level":2,"score":0.26030001044273376},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2529999911785126},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.25839","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.25839","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.25839","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.25839","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Deep":[0],"neural":[1,57,173],"networks":[2,58,174],"exhibit":[3],"a":[4,7,40,60,146,164],"simplicity":[5,51],"bias,":[6],"well-documented":[8],"tendency":[9],"to":[10,104],"favor":[11],"simple":[12,101],"functions":[13],"over":[14],"complex":[15,105,156],"ones.":[16],"In":[17],"this":[18,25],"work,":[19],"we":[20,122],"cast":[21],"new":[22],"light":[23],"on":[24,163],"phenomenon":[26],"through":[27,59,95],"the":[28,31,70,79,86,110,117,152,169,176],"lens":[29],"of":[30,42,68,77,88,148,154,172,179],"Minimum":[32],"Description":[33],"Length":[34],"principle,":[35],"formalizing":[36],"supervised":[37],"learning":[38,153],"as":[39,85,145,181],"problem":[41],"optimal":[43,182],"two-part":[44,183],"lossless":[45],"compression.":[46],"Our":[47,81],"theory":[48,162],"explains":[49],"how":[50],"bias":[52],"governs":[53],"feature":[54,170],"selection":[55,171],"in":[56,112],"fundamental":[61],"trade-off":[62],"between":[63],"model":[64,119],"complexity":[65],"(the":[66,75],"cost":[67,76,115],"describing":[69,78],"hypothesis)":[71],"and":[72,137],"predictive":[73],"power":[74],"data).":[80],"framework":[82],"predicts":[83],"that":[84,168],"amount":[87],"available":[89],"training":[90],"data":[91,113,125,129,142],"increases,":[92],"learners":[93],"transition":[94],"qualitatively":[96],"different":[97],"features":[98,106],"--":[99,107],"from":[100],"spurious":[102],"shortcuts":[103],"only":[108],"when":[109],"reduction":[111],"encoding":[114],"justifies":[116],"increased":[118],"complexity.":[120],"Consequently,":[121],"identify":[123],"distinct":[124],"regimes":[126,139],"where":[127,140],"increasing":[128],"promotes":[130],"robustness":[131],"by":[132],"ruling":[133],"out":[134],"trivial":[135],"shortcuts,":[136],"conversely,":[138],"limiting":[141],"can":[143],"act":[144],"form":[147],"complexity-based":[149],"regularization,":[150],"preventing":[151],"unreliable":[155],"environmental":[157],"cues.":[158],"We":[159],"validate":[160],"our":[161],"semi-synthetic":[165],"benchmark":[166],"showing":[167],"follows":[175],"same":[177],"trajectory":[178],"solutions":[180],"compressors.":[184]},"counts_by_year":[],"updated_date":"2026-03-31T06:07:48.031334","created_date":"2026-03-31T00:00:00"}
