{"id":"https://openalex.org/W7128644877","doi":"https://doi.org/10.48550/arxiv.2602.09789","title":"When Less is More: The LLM Scaling Paradox in Context Compression","display_name":"When Less is More: The LLM Scaling Paradox in Context Compression","publication_year":2026,"publication_date":"2026-02-10","ids":{"openalex":"https://openalex.org/W7128644877","doi":"https://doi.org/10.48550/arxiv.2602.09789"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.09789","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125623843","display_name":"Ruishan Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Ruishan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125663152","display_name":"Yibing Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yibing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125675336","display_name":"Guoxin Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Guoxin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125629492","display_name":"Yan Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124889512","display_name":"Yueyang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yueyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125657787","display_name":"Long Xia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xia, Long","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125642997","display_name":"Kecheng Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Kecheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125640374","display_name":"Zhiyuan Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Zhiyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125663135","display_name":"Daiting Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Daiting","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2531999945640564,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2531999945640564,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.1039000004529953,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.08290000259876251,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/lossy-compression","display_name":"Lossy compression","score":0.6431999802589417},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5964999794960022},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.5295000076293945},{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.51419997215271},{"id":"https://openalex.org/keywords/paraphrase","display_name":"Paraphrase","score":0.47200000286102295},{"id":"https://openalex.org/keywords/context-model","display_name":"Context model","score":0.4415000081062317},{"id":"https://openalex.org/keywords/complement","display_name":"Complement (music)","score":0.4390000104904175},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.4334999918937683},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.4122999906539917}],"concepts":[{"id":"https://openalex.org/C165021410","wikidata":"https://www.wikidata.org/wiki/Q55564","display_name":"Lossy compression","level":2,"score":0.6431999802589417},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5964999794960022},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5655999779701233},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.5295000076293945},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.51419997215271},{"id":"https://openalex.org/C2780922921","wikidata":"https://www.wikidata.org/wiki/Q255189","display_name":"Paraphrase","level":2,"score":0.47200000286102295},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.4415000081062317},{"id":"https://openalex.org/C112313634","wikidata":"https://www.wikidata.org/wiki/Q7886648","display_name":"Complement (music)","level":5,"score":0.4390000104904175},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43560001254081726},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.4334999918937683},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.4122999906539917},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.40130001306533813},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.3950999975204468},{"id":"https://openalex.org/C81081738","wikidata":"https://www.wikidata.org/wiki/Q55542","display_name":"Lossless compression","level":3,"score":0.3630000054836273},{"id":"https://openalex.org/C76188268","wikidata":"https://www.wikidata.org/wiki/Q1783165","display_name":"Context effect","level":3,"score":0.3336000144481659},{"id":"https://openalex.org/C94835093","wikidata":"https://www.wikidata.org/wiki/Q3113333","display_name":"Data compression ratio","level":5,"score":0.3253999948501587},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3246000111103058},{"id":"https://openalex.org/C2780069185","wikidata":"https://www.wikidata.org/wiki/Q7977945","display_name":"Equivalence (formal languages)","level":2,"score":0.3102000057697296},{"id":"https://openalex.org/C57654395","wikidata":"https://www.wikidata.org/wiki/Q1097775","display_name":"Compression artifact","level":5,"score":0.30480000376701355},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.30469998717308044},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2856000065803528},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.27079999446868896},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.267300009727478},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.266400009393692},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.259799987077713},{"id":"https://openalex.org/C137546455","wikidata":"https://www.wikidata.org/wiki/Q3213474","display_name":"Trigram","level":2,"score":0.25920000672340393},{"id":"https://openalex.org/C167981619","wikidata":"https://www.wikidata.org/wiki/Q1685498","display_name":"Cross entropy","level":3,"score":0.2549000084400177},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.251800000667572}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.09789","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.09789","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.09789","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.09789","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Scaling":[0],"up":[1],"model":[2,55],"parameters":[3],"has":[4],"long":[5],"been":[6],"a":[7,28,33,179],"prevalent":[8],"training":[9],"paradigm":[10],"driven":[11],"by":[12],"the":[13,41,136,185],"assumption":[14],"that":[15,148],"larger":[16,73,96,129],"models":[17,74,97],"yield":[18],"superior":[19],"generation":[20,190],"capabilities.":[21],"However,":[22],"under":[23],"lossy":[24],"context":[25,175],"compression":[26,59,176],"in":[27,131],"compressor--decoder":[29],"setup,":[30],"we":[31,61,145],"find":[32],"\\textbf{\\textit{Size-Fidelity":[34],"Paradox}}:":[35],"increasing":[36],"compressor":[37,52],"size":[38],"can":[39],"lessen":[40],"faithfulness":[42],"of":[43,105,174,181],"reconstructed":[44],"contexts":[45],"though":[46],"reconstruction":[47,143],"error":[48],"decreases.":[49],"Across":[50],"27":[51],"setups":[53],"spanning":[54],"families,":[56],"scales,":[57],"and":[58,92,142,166,177],"rates,":[60],"coin":[62],"this":[63,118],"paradox":[64,119],"arising":[65],"from":[66,188],"two":[67],"dominant":[68],"factors:":[69],"1)":[70],"\\textit{knowledge":[71],"overwriting}:":[72],"increasingly":[75],"replace":[76],"source":[77],"facts":[78],"with":[79,124],"their":[80],"own":[81],"prior":[82],"beliefs,":[83],"\\textit{e.g.},":[84,109],"``the":[85,89],"white":[86],"strawberry``":[87],"$\\to$":[88,113],"red":[90],"strawberry``;":[91],"2)":[93],"\\textit{semantic":[94],"drift}:":[95],"tend":[98,150],"to":[99,151,163,191],"paraphrase":[100],"or":[101],"restructure":[102],"content":[103],"instead":[104],"reproducing":[106],"it":[107],"verbatim,":[108],"``Alice":[110],"hit":[111,115],"Bob``":[112],"``Bob":[114],"Alice``.":[116],"Interestingly,":[117],"persists":[120],"across":[121,154],"varied":[122],"settings,":[123],"mid-sized":[125],"compressors":[126,149],"often":[127],"outperforming":[128],"ones":[130],"faithful":[132,192],"recovery.":[133,168],"By":[134],"analyzing":[135],"compressed":[137],"memory":[138,153],"via":[139],"embedding":[140],"geometry":[141],"determinacy,":[144],"further":[146],"reveal":[147],"organize":[152],"broader":[155],"semantic":[156],"subspaces,":[157],"yielding":[158],"more":[159],"ambiguous":[160],"representations":[161],"prone":[162],"overwriting,":[164],"drift,":[165],"weakened":[167],"These":[169],"findings":[170],"complement":[171],"existing":[172],"evaluations":[173],"expose":[178],"breakdown":[180],"scaling":[182],"laws":[183],"when":[184],"objective":[186],"shifts":[187],"plausible":[189],"preservation.":[193]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-12T00:00:00"}
