{"id":"https://openalex.org/W7150877062","doi":"https://doi.org/10.48550/arxiv.2604.02343","title":"Haiku to Opus in Just 10 bits: LLMs Unlock Massive Compression Gains","display_name":"Haiku to Opus in Just 10 bits: LLMs Unlock Massive Compression Gains","publication_year":2026,"publication_date":"2026-02-09","ids":{"openalex":"https://openalex.org/W7150877062","doi":"https://doi.org/10.48550/arxiv.2604.02343"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.02343","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.02343","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.02343","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133014080","display_name":"Roy Rinberg","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Rinberg, Roy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116335567","display_name":"Annabelle Michael Carrell","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Carrell, Annabelle Michael","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133019390","display_name":"Simon Henniger","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Henniger, Simon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133041094","display_name":"Nicholas Carlini","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Carlini, Nicholas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133028014","display_name":"Keri Warr","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Warr, Keri","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5133014080"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.7925000190734863,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.7925000190734863,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10126","display_name":"Logic, programming, and type systems","score":0.03400000184774399,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.03290000185370445,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/lossy-compression","display_name":"Lossy compression","score":0.902899980545044},{"id":"https://openalex.org/keywords/lossless-compression","display_name":"Lossless compression","score":0.8962000012397766},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.609499990940094},{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.6015999913215637},{"id":"https://openalex.org/keywords/arithmetic-coding","display_name":"Arithmetic coding","score":0.5835999846458435},{"id":"https://openalex.org/keywords/image-compression","display_name":"Image compression","score":0.5019000172615051},{"id":"https://openalex.org/keywords/color-cell-compression","display_name":"Color Cell Compression","score":0.5012000203132629},{"id":"https://openalex.org/keywords/data-compression-ratio","display_name":"Data compression ratio","score":0.4779999852180481}],"concepts":[{"id":"https://openalex.org/C165021410","wikidata":"https://www.wikidata.org/wiki/Q55564","display_name":"Lossy compression","level":2,"score":0.902899980545044},{"id":"https://openalex.org/C81081738","wikidata":"https://www.wikidata.org/wiki/Q55542","display_name":"Lossless compression","level":3,"score":0.8962000012397766},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6406000256538391},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.609499990940094},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.6015999913215637},{"id":"https://openalex.org/C153338461","wikidata":"https://www.wikidata.org/wiki/Q2651","display_name":"Arithmetic coding","level":4,"score":0.5835999846458435},{"id":"https://openalex.org/C13481523","wikidata":"https://www.wikidata.org/wiki/Q412438","display_name":"Image compression","level":4,"score":0.5019000172615051},{"id":"https://openalex.org/C82804729","wikidata":"https://www.wikidata.org/wiki/Q5148551","display_name":"Color Cell Compression","level":5,"score":0.5012000203132629},{"id":"https://openalex.org/C94835093","wikidata":"https://www.wikidata.org/wiki/Q3113333","display_name":"Data compression ratio","level":5,"score":0.4779999852180481},{"id":"https://openalex.org/C175732694","wikidata":"https://www.wikidata.org/wiki/Q1128713","display_name":"Context-adaptive binary arithmetic coding","level":3,"score":0.4708000123500824},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.46970000863075256},{"id":"https://openalex.org/C25797200","wikidata":"https://www.wikidata.org/wiki/Q828137","display_name":"Compression ratio","level":3,"score":0.4318999946117401},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3813000023365021},{"id":"https://openalex.org/C54243161","wikidata":"https://www.wikidata.org/wiki/Q39333","display_name":"Texture compression","level":5,"score":0.3806999921798706},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.3630000054836273},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.3625999987125397},{"id":"https://openalex.org/C66656319","wikidata":"https://www.wikidata.org/wiki/Q2638","display_name":"Golomb coding","level":5,"score":0.34880000352859497},{"id":"https://openalex.org/C57654395","wikidata":"https://www.wikidata.org/wiki/Q1097775","display_name":"Compression artifact","level":5,"score":0.3310999870300293},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.3151000142097473},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.302700012922287},{"id":"https://openalex.org/C57890076","wikidata":"https://www.wikidata.org/wiki/Q4680725","display_name":"Adaptive coding","level":4,"score":0.29030001163482666},{"id":"https://openalex.org/C169805256","wikidata":"https://www.wikidata.org/wiki/Q1361381","display_name":"Transform coding","level":4,"score":0.27619999647140503},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27489998936653137},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.2574999928474426}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.02343","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.02343","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.02343","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.02343","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.4647369086742401}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,76],"study":[1],"the":[2,22,43,73,88,129],"compression":[3,18,41,63,80,149,163],"of":[4,24,65,128,151],"LLM-generated":[5],"text":[6],"across":[7],"lossless":[8,28],"and":[9,119,135,141],"lossy":[10,48,84],"regimes,":[11],"characterizing":[12],"a":[13,51,54,68,104,133],"compression-compute":[14],"frontier":[15],"where":[16],"more":[17,25,176],"is":[19,156],"possible":[20],"at":[21],"cost":[23],"compute.":[26],"For":[27,47],"compression,":[29,49],"domain-adapted":[30],"LoRA":[31],"adapters":[32],"can":[33,61,172],"improve":[34],"LLM-based":[35,162],"arithmetic":[36,59],"coding":[37,60],"by":[38,87,99],"2x":[39,69],"over":[40,71,157],"with":[42],"base":[44],"LLM":[45],"alone.":[46],"prompting":[50],"model":[52,94,137],"for":[53],"succinct":[55],"rewrite":[56],"then":[57],"applying":[58],"achieve":[62],"ratios":[64,150],"approximately":[66],"0.03,":[67],"improvement":[70],"compressing":[72],"original":[74],"response.":[75],"further":[77],"introduce":[78],"Question-Asking":[79],"(QA),":[81],"an":[82],"interactive":[83,170],"protocol":[85],"inspired":[86],"game":[89],"'Twenty":[90],"Questions'.":[91],"A":[92],"small":[93,134],"iteratively":[95],"refines":[96],"its":[97],"response":[98],"asking":[100],"yes/no":[101],"questions":[102,123],"to":[103,126,143,153],"stronger":[105],"model,":[106],"transferring":[107],"exactly":[108],"one":[109],"bit":[110],"per":[111],"answer.":[112],"On":[113],"8":[114],"benchmarks":[115,140],"spanning":[116],"math,":[117],"science,":[118],"code,":[120],"10":[121],"binary":[122],"recover":[124],"23%":[125],"72%":[127],"capability":[130],"gap":[131],"between":[132],"large":[136],"on":[138,145],"standard":[139],"7%":[142],"38%":[144],"harder":[146],"benchmarks,":[147],"achieving":[148],"0.0006":[152],"0.004.":[154],"This":[155],"100x":[158],"smaller":[159],"than":[160,178],"prior":[161],"(Deletang":[164],"et":[165],"al.,":[166],"2024),":[167],"suggesting":[168],"that":[169],"protocols":[171],"transfer":[173],"knowledge":[174],"far":[175],"efficiently":[177],"transmitting":[179],"full":[180],"responses.":[181]},"counts_by_year":[],"updated_date":"2026-04-07T06:06:30.997549","created_date":"2026-04-07T00:00:00"}
