{"id":"https://openalex.org/W4360985465","doi":"https://doi.org/10.1007/s41781-023-00095-9","title":"Fast Columnar Physics Analyses of Terabyte-Scale LHC Data on a Cache-Aware Dask Cluster","display_name":"Fast Columnar Physics Analyses of Terabyte-Scale LHC Data on a Cache-Aware Dask Cluster","publication_year":2023,"publication_date":"2023-03-20","ids":{"openalex":"https://openalex.org/W4360985465","doi":"https://doi.org/10.1007/s41781-023-00095-9"},"language":"en","primary_location":{"id":"doi:10.1007/s41781-023-00095-9","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1007/s41781-023-00095-9","pdf_url":"https://link.springer.com/content/pdf/10.1007/s41781-023-00095-9.pdf","source":{"id":"https://openalex.org/S4210229695","display_name":"Computing and Software for Big Science","issn_l":"2510-2036","issn":["2510-2036","2510-2044"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computing and Software for Big Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s41781-023-00095-9.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013254371","display_name":"N. Eich","orcid":"https://orcid.org/0000-0001-9494-4317"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Niclas Eich","raw_affiliation_strings":["Physics Institute 3A, RWTH Aachen University, 52056, Aachen, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Physics Institute 3A, RWTH Aachen University, 52056, Aachen, Germany","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049875695","display_name":"M. Erdmann","orcid":"https://orcid.org/0000-0002-1653-1303"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Martin Erdmann","raw_affiliation_strings":["Physics Institute 3A, RWTH Aachen University, 52056, Aachen, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Physics Institute 3A, RWTH Aachen University, 52056, Aachen, Germany","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015567755","display_name":"P. Fackeldey","orcid":"https://orcid.org/0000-0003-4932-7162"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Peter Fackeldey","raw_affiliation_strings":["Physics Institute 3A, RWTH Aachen University, 52056, Aachen, Germany"],"raw_orcid":"https://orcid.org/0000-0003-4932-7162","affiliations":[{"raw_affiliation_string":"Physics Institute 3A, RWTH Aachen University, 52056, Aachen, Germany","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037598492","display_name":"Benjamin Fischer","orcid":"https://orcid.org/0000-0002-3900-3482"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Benjamin Fischer","raw_affiliation_strings":["Physics Institute 3A, RWTH Aachen University, 52056, Aachen, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Physics Institute 3A, RWTH Aachen University, 52056, Aachen, Germany","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5105514105","display_name":"D. Noll","orcid":"https://orcid.org/0000-0002-0176-2360"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Dennis Noll","raw_affiliation_strings":["Physics Institute 3A, RWTH Aachen University, 52056, Aachen, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Physics Institute 3A, RWTH Aachen University, 52056, Aachen, Germany","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110777048","display_name":"Yannik Rath","orcid":null},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Yannik Rath","raw_affiliation_strings":["Physics Institute 3A, RWTH Aachen University, 52056, Aachen, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Physics Institute 3A, RWTH Aachen University, 52056, Aachen, Germany","institution_ids":["https://openalex.org/I887968799"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5013254371"],"corresponding_institution_ids":["https://openalex.org/I887968799"],"apc_list":{"value":2590,"currency":"EUR","value_usd":3280},"apc_paid":{"value":2590,"currency":"EUR","value_usd":3280},"fwci":0.3935,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.58736408,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"7","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/terabyte","display_name":"Terabyte","score":0.9717621803283691},{"id":"https://openalex.org/keywords/large-hadron-collider","display_name":"Large Hadron Collider","score":0.8099865317344666},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.7242810130119324},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6969985961914062},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.5614771246910095},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5375217199325562},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.499509334564209},{"id":"https://openalex.org/keywords/cluster","display_name":"Cluster (spacecraft)","score":0.48594748973846436},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.4759516417980194},{"id":"https://openalex.org/keywords/complement","display_name":"Complement (music)","score":0.47275716066360474},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.41893765330314636},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.412993848323822},{"id":"https://openalex.org/keywords/particle-physics","display_name":"Particle physics","score":0.30819737911224365},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.2707497775554657},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.24990996718406677}],"concepts":[{"id":"https://openalex.org/C199683683","wikidata":"https://www.wikidata.org/wiki/Q8799","display_name":"Terabyte","level":2,"score":0.9717621803283691},{"id":"https://openalex.org/C87668248","wikidata":"https://www.wikidata.org/wiki/Q40605","display_name":"Large Hadron Collider","level":2,"score":0.8099865317344666},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.7242810130119324},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6969985961914062},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.5614771246910095},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5375217199325562},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.499509334564209},{"id":"https://openalex.org/C164866538","wikidata":"https://www.wikidata.org/wiki/Q367351","display_name":"Cluster (spacecraft)","level":2,"score":0.48594748973846436},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.4759516417980194},{"id":"https://openalex.org/C112313634","wikidata":"https://www.wikidata.org/wiki/Q7886648","display_name":"Complement (music)","level":5,"score":0.47275716066360474},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.41893765330314636},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.412993848323822},{"id":"https://openalex.org/C109214941","wikidata":"https://www.wikidata.org/wiki/Q18334","display_name":"Particle physics","level":1,"score":0.30819737911224365},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.2707497775554657},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.24990996718406677},{"id":"https://openalex.org/C188082640","wikidata":"https://www.wikidata.org/wiki/Q1780899","display_name":"Complementation","level":4,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C127716648","wikidata":"https://www.wikidata.org/wiki/Q104053","display_name":"Phenotype","level":3,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s41781-023-00095-9","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1007/s41781-023-00095-9","pdf_url":"https://link.springer.com/content/pdf/10.1007/s41781-023-00095-9.pdf","source":{"id":"https://openalex.org/S4210229695","display_name":"Computing and Software for Big Science","issn_l":"2510-2036","issn":["2510-2036","2510-2044"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computing and Software for Big Science","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s41781-023-00095-9","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1007/s41781-023-00095-9","pdf_url":"https://link.springer.com/content/pdf/10.1007/s41781-023-00095-9.pdf","source":{"id":"https://openalex.org/S4210229695","display_name":"Computing and Software for Big Science","issn_l":"2510-2036","issn":["2510-2036","2510-2044"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computing and Software for Big Science","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"},{"id":"https://openalex.org/F4320321114","display_name":"Bundesministerium f\u00fcr Bildung und Forschung","ror":"https://ror.org/04pz7b180"},{"id":"https://openalex.org/F4320324232","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4360985465.pdf"},"referenced_works_count":8,"referenced_works":["https://openalex.org/W2973742427","https://openalex.org/W3035965352","https://openalex.org/W3098104888","https://openalex.org/W3099878876","https://openalex.org/W4230804723","https://openalex.org/W4300439692","https://openalex.org/W6912538520","https://openalex.org/W6969144114"],"related_works":["https://openalex.org/W2058965144","https://openalex.org/W1976914335","https://openalex.org/W2164382479","https://openalex.org/W98480971","https://openalex.org/W2150291671","https://openalex.org/W2027972911","https://openalex.org/W2146343568","https://openalex.org/W2013643406","https://openalex.org/W2066858118","https://openalex.org/W2018090346"],"abstract_inverted_index":{"Abstract":[0],"The":[1],"development":[2],"of":[3,16,18,24,26,60,114,132,135],"an":[4,107,111,129],"LHC":[5],"physics":[6,46,104],"analysis":[7,28,105],"involves":[8],"numerous":[9],"investigations":[10],"that":[11],"require":[12],"the":[13,34,63,87,117,141],"repeated":[14],"processing":[15,59],"terabytes":[17],"data.":[19],"Thus,":[20],"a":[21,39,100,133],"rapid":[22],"completion":[23],"each":[25],"these":[27],"cycles":[29],"is":[30],"central":[31],"to":[32,41,77,145],"mastering":[33],"science":[35],"project.":[36],"We":[37],"present":[38],"solution":[40,53],"efficiently":[42,73],"handle":[43],"and":[44,72,94,127],"accelerate":[45],"analyses":[47],"on":[48,69,86],"small-size":[49],"institute":[50],"clusters.":[51],"Our":[52],"uses":[54],"three":[55],"key":[56,89],"concepts:":[57],"vectorized":[58],"collision":[61],"events,":[62],"\u201cMapReduce\u201d":[64],"paradigm":[65],"for":[66,119],"scaling":[67],"out":[68],"computing":[70],"clusters,":[71],"utilized":[74],"SSD":[75],"caching":[76],"reduce":[78],"latencies":[79],"in":[80,116],"IO":[81],"operations.":[82],"This":[83],"work":[84],"focuses":[85],"latter":[88],"concept,":[90],"its":[91,95],"underlying":[92],"mechanism,":[93],"implementation.":[96],"Using":[97],"simulations":[98],"from":[99,143],"Higgs":[101],"pair":[102],"production":[103],"as":[106],"example,":[108],"we":[109],"achieve":[110],"improvement":[112],"factor":[113,134],"6.3":[115],"runtime":[118,142],"reading":[120],"all":[121],"input":[122],"data":[123],"after":[124,137],"one":[125],"cycle":[126],"even":[128],"overall":[130],"speedup":[131],"14.9":[136],"10":[138],"cycles,":[139],"reducing":[140],"hours":[144],"minutes.":[146]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-12-22T23:10:17.713674","created_date":"2025-10-10T00:00:00"}
