{"id":"https://openalex.org/W4385623118","doi":"https://doi.org/10.1145/3588195.3592992","title":"Rapidgzip: Parallel Decompression and Seeking in Gzip Files Using Cache Prefetching","display_name":"Rapidgzip: Parallel Decompression and Seeking in Gzip Files Using Cache Prefetching","publication_year":2023,"publication_date":"2023-08-07","ids":{"openalex":"https://openalex.org/W4385623118","doi":"https://doi.org/10.1145/3588195.3592992"},"language":"en","primary_location":{"id":"doi:10.1145/3588195.3592992","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3588195.3592992","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd International Symposium on High-Performance Parallel and Distributed Computing","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2308.08955","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028422914","display_name":"Maximilian Knespel","orcid":"https://orcid.org/0000-0001-9568-3075"},"institutions":[{"id":"https://openalex.org/I78650965","display_name":"TU Dresden","ror":"https://ror.org/042aqky30","country_code":"DE","type":"education","lineage":["https://openalex.org/I78650965"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Maximilian Knespel","raw_affiliation_strings":["Technische Universit\u00e4t Dresden, Dresden, Germany"],"affiliations":[{"raw_affiliation_string":"Technische Universit\u00e4t Dresden, Dresden, Germany","institution_ids":["https://openalex.org/I78650965"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063897980","display_name":"Holger Brunst","orcid":"https://orcid.org/0000-0003-2224-0630"},"institutions":[{"id":"https://openalex.org/I78650965","display_name":"TU Dresden","ror":"https://ror.org/042aqky30","country_code":"DE","type":"education","lineage":["https://openalex.org/I78650965"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Holger Brunst","raw_affiliation_strings":["Technische Universit\u00e4t Dresden, Dresden, Germany"],"affiliations":[{"raw_affiliation_string":"Technische Universit\u00e4t Dresden, Dresden, Germany","institution_ids":["https://openalex.org/I78650965"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5028422914"],"corresponding_institution_ids":["https://openalex.org/I78650965"],"apc_list":null,"apc_paid":null,"fwci":1.2306,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.83391914,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"295","last_page":"307"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8903970718383789},{"id":"https://openalex.org/keywords/byte","display_name":"Byte","score":0.6813436150550842},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.6426083445549011},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.6397022008895874},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5455521941184998},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.4749346375465393},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.3154789209365845},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.15480461716651917}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8903970718383789},{"id":"https://openalex.org/C43364308","wikidata":"https://www.wikidata.org/wiki/Q8799","display_name":"Byte","level":2,"score":0.6813436150550842},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.6426083445549011},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.6397022008895874},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5455521941184998},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.4749346375465393},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.3154789209365845},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.15480461716651917}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3588195.3592992","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3588195.3592992","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd International Symposium on High-Performance Parallel and Distributed Computing","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2308.08955","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2308.08955","pdf_url":"https://arxiv.org/pdf/2308.08955","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2308.08955","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2308.08955","pdf_url":"https://arxiv.org/pdf/2308.08955","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321613","display_name":"Technische Universit\u00e4t Dresden","ror":"https://ror.org/042aqky30"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4385623118.pdf"},"referenced_works_count":16,"referenced_works":["https://openalex.org/W220935706","https://openalex.org/W1777016212","https://openalex.org/W1877865836","https://openalex.org/W2022126655","https://openalex.org/W2024171325","https://openalex.org/W2059343366","https://openalex.org/W2060108852","https://openalex.org/W2107745473","https://openalex.org/W2294693415","https://openalex.org/W2887854925","https://openalex.org/W2963235000","https://openalex.org/W2965674501","https://openalex.org/W2965891918","https://openalex.org/W3014663963","https://openalex.org/W4230804723","https://openalex.org/W4249806163"],"related_works":["https://openalex.org/W2317245370","https://openalex.org/W4249323025","https://openalex.org/W198851386","https://openalex.org/W2030310580","https://openalex.org/W947442053","https://openalex.org/W1980160788","https://openalex.org/W2148915962","https://openalex.org/W2283866686","https://openalex.org/W4287182096","https://openalex.org/W27867058"],"abstract_inverted_index":{"Gzip":[0],"is":[1,7],"a":[2,11,51,93,96,118,140,156],"file":[3,79,120],"compression":[4],"format,":[5],"which":[6,107],"ubiquitously":[8],"used.":[9],"Although":[10],"multitude":[12],"of":[13,53,117,142,158],"gzip":[14,33,119],"implementations":[15],"exist,":[16],"only":[17,41],"pugz":[18,29,59,83],"can":[19,61,84,101,108],"fully":[20],"utilize":[21],"current":[22],"multi-core":[23],"processor":[24],"architectures":[25],"for":[26,136,152],"decompression.":[27],"Yet,":[28],"cannot":[30],"decompress":[31],"arbitrary":[32,66],"files.":[34],"It":[35],"requires":[36],"the":[37,54,75,78,115,145,153],"decompressed":[38],"stream":[39],"to":[40,65],"contain":[42],"byte":[43],"values":[44],"9-126.":[45],"In":[46],"this":[47],"work,":[48],"we":[49],"present":[50],"generalization":[52],"parallelization":[55],"scheme":[56],"used":[57],"by":[58,82,87,121],"that":[60,74],"be":[62,85],"reliably":[63],"applied":[64],"gzip-compressed":[67,137],"data":[68],"without":[69],"compromising":[70],"performance.":[71],"We":[72],"show":[73],"requirements":[76],"on":[77,92],"contents":[80],"posed":[81],"dropped":[86],"implementing":[88],"an":[89],"architecture":[90,100],"based":[91],"cache":[94],"and":[95,124,149],"parallelized":[97],"prefetcher.":[98],"This":[99],"safely":[102],"handle":[103],"faulty":[104],"decompression":[105,134],"results,":[106],"appear":[109],"when":[110],"threads":[111],"start":[112],"decompressing":[113],"in":[114],"middle":[116],"using":[122],"trial":[123],"error.":[125],"Using":[126],"128":[127],"cores,":[128],"our":[129],"implementation":[130],"reaches":[131],"8.7":[132],"GB/s":[133,151],"bandwidth":[135],"base64-encoded":[138],"data,":[139],"speedup":[141,157],"55":[143],"over":[144,160],"single-threaded":[146],"GNU":[147,161],"gzip,":[148],"5.6":[150],"Silesia":[154],"corpus,":[155],"33":[159],"gzip.":[162]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":4}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2023-08-08T00:00:00"}
