{"id":"https://openalex.org/W7125180742","doi":"https://doi.org/10.48550/arxiv.2601.13220","title":"The Energy-Throughput Trade-off in Lossless-Compressed Source Code Storage","display_name":"The Energy-Throughput Trade-off in Lossless-Compressed Source Code Storage","publication_year":2026,"publication_date":"2026-01-19","ids":{"openalex":"https://openalex.org/W7125180742","doi":"https://doi.org/10.48550/arxiv.2601.13220"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.13220","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.13220","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.13220","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046786328","display_name":"Paolo Ferragina","orcid":"https://orcid.org/0000-0003-1353-360X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ferragina, Paolo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5003830291","display_name":"Francesco Tosoni","orcid":"https://orcid.org/0000-0001-8457-3866"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tosoni, Francesco","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5046786328"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.4733000099658966,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.4733000099658966,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.25609999895095825,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.04270000010728836,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.5996999740600586},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5659000277519226},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.5627999901771545},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.5113999843597412},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.447299987077713},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.439300000667572},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.4271000027656555},{"id":"https://openalex.org/keywords/computer-data-storage","display_name":"Computer data storage","score":0.4099999964237213}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.738099992275238},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.5996999740600586},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5659000277519226},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.5627999901771545},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.5113999843597412},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.447299987077713},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.439300000667572},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.4271000027656555},{"id":"https://openalex.org/C194739806","wikidata":"https://www.wikidata.org/wiki/Q66221","display_name":"Computer data storage","level":2,"score":0.4099999964237213},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.4009999930858612},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.36500000953674316},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.34130001068115234},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.3402000069618225},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.32420000433921814},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.3188000023365021},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.3093999922275543},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.3043000102043152},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2897999882698059},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.28870001435279846},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.2854999899864197},{"id":"https://openalex.org/C25797200","wikidata":"https://www.wikidata.org/wiki/Q828137","display_name":"Compression ratio","level":3,"score":0.28540000319480896},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.2786000072956085},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2782999873161316},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.27799999713897705},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.2734000086784363},{"id":"https://openalex.org/C121957198","wikidata":"https://www.wikidata.org/wiki/Q14365593","display_name":"KPI-driven code analysis","level":5,"score":0.26980000734329224},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.26820001006126404},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.2623000144958496},{"id":"https://openalex.org/C3018397939","wikidata":"https://www.wikidata.org/wiki/Q3644502","display_name":"Open source","level":3,"score":0.2583000063896179},{"id":"https://openalex.org/C2982719155","wikidata":"https://www.wikidata.org/wiki/Q25584060","display_name":"Energy source","level":3,"score":0.251800000667572}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.13220","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.13220","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.13220","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.13220","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.42020806670188904,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Retrieving":[0],"data":[1,90],"from":[2],"large-scale":[3,39],"source":[4,40],"code":[5,41,161],"archives":[6],"is":[7,103],"vital":[8],"for":[9,35,152,158],"AI":[10],"training,":[11],"neural-based":[12],"software":[13],"analysis,":[14],"and":[15,25,55,78,84,92,113,130,149],"information":[16],"retrieval,":[17],"to":[18],"cite":[19],"a":[20,31,61,118,143],"few.":[21],"This":[22,122],"paper":[23],"studies":[24],"experiments":[26,59],"with":[27,74,142],"the":[28,36,107,115],"design":[29],"of":[30,38,110,117,145],"compressed":[32],"key-value":[33],"store":[34],"indexing":[37],"datasets,":[42],"evaluating":[43],"its":[44],"trade-off":[45],"among":[46],"three":[47],"primary":[48],"computational":[49],"resources:":[50],"(compressed)":[51],"space":[52],"occupancy,":[53],"time,":[54],"energy":[56,85,101],"efficiency.":[57,86],"Extensive":[58],"on":[60],"national":[62],"high-performance":[63],"computing":[64],"infrastructure":[65],"demonstrate":[66],"that":[67],"different":[68],"compression":[69,76],"configurations":[70],"yield":[71],"distinct":[72],"trade-offs,":[73],"high":[75],"ratios":[77],"order-of-magnitude":[79],"gains":[80],"in":[81,126,135],"retrieval":[82],"throughput":[83],"We":[87],"also":[88],"study":[89],"parallelism":[91],"show":[93],"that,":[94],"while":[95],"it":[96],"significantly":[97],"improves":[98],"speed,":[99],"scaling":[100],"efficiency":[102],"more":[104],"difficult,":[105],"reflecting":[106],"known":[108],"non-energy-proportionality":[109],"modern":[111],"hardware":[112],"challenging":[114],"assumption":[116],"direct":[119],"time-energy":[120],"correlation.":[121],"work":[123],"streamlines":[124],"automation":[125],"energy-aware":[127],"configuration":[128],"tuning":[129],"standardized":[131],"green":[132],"benchmarking":[133],"deployable":[134],"CI/CD":[136],"pipelines,":[137],"thus":[138],"empowering":[139],"system":[140],"architects":[141],"spectrum":[144],"Pareto-optimal":[146],"energy-compression-throughput":[147],"trade-offs":[148],"actionable":[150],"guidelines":[151],"building":[153],"sustainable,":[154],"efficient":[155],"storage":[156],"backends":[157],"massive":[159],"open-source":[160],"archival.":[162]},"counts_by_year":[],"updated_date":"2026-01-22T23:33:04.759266","created_date":"2026-01-22T00:00:00"}
