{"id":"https://openalex.org/W7154265911","doi":"https://doi.org/10.48550/arxiv.2604.10295","title":"Icicle: Scalable Metadata Indexing and Real-Time Monitoring for HPC File Systems","display_name":"Icicle: Scalable Metadata Indexing and Real-Time Monitoring for HPC File Systems","publication_year":2026,"publication_date":"2026-04-11","ids":{"openalex":"https://openalex.org/W7154265911","doi":"https://doi.org/10.48550/arxiv.2604.10295"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.10295","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10295","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.10295","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058211635","display_name":"Haochen Pan","orcid":"https://orcid.org/0009-0006-8992-5895"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Haochen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088145676","display_name":"Ryan Chard","orcid":"https://orcid.org/0000-0002-6781-7432"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chard, Ryan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5105207290","display_name":"Song Young Oh","orcid":"https://orcid.org/0009-0005-4827-8014"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oh, Song Young","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001374377","display_name":"Maxime Gonthier","orcid":"https://orcid.org/0000-0003-3306-0483"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gonthier, Maxime","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133625686","display_name":"Val\u00e9rie Hayot-Sasson","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hayot-Sasson, Val\u00e9rie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004843972","display_name":"Geoffrey Lentner","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lentner, Geoffrey","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104851825","display_name":"Joe Bottigliero","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bottigliero, Joe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009365131","display_name":"Rachana Ananthakrishnan","orcid":"https://orcid.org/0000-0002-2187-9988"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ananthakrishnan, Rachana","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065464552","display_name":"Kyle Chard","orcid":"https://orcid.org/0000-0002-7370-4805"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chard, Kyle","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5032231503","display_name":"Ian Foster","orcid":"https://orcid.org/0000-0003-2129-5269"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Foster, Ian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.4366999864578247,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.4366999864578247,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.22689999639987946,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.05620000138878822,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.8083999752998352},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6718999743461609},{"id":"https://openalex.org/keywords/file-system","display_name":"File system","score":0.652899980545044},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.612500011920929},{"id":"https://openalex.org/keywords/lustre","display_name":"Lustre (file system)","score":0.5529000163078308},{"id":"https://openalex.org/keywords/distributed-file-system","display_name":"Distributed File System","score":0.46070000529289246},{"id":"https://openalex.org/keywords/journaling-file-system","display_name":"Journaling file system","score":0.43619999289512634},{"id":"https://openalex.org/keywords/analytics","display_name":"Analytics","score":0.4318000078201294},{"id":"https://openalex.org/keywords/flat-file-database","display_name":"Flat file database","score":0.3783999979496002}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8353000283241272},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.8083999752998352},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6718999743461609},{"id":"https://openalex.org/C2780940931","wikidata":"https://www.wikidata.org/wiki/Q174989","display_name":"File system","level":2,"score":0.652899980545044},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.612500011920929},{"id":"https://openalex.org/C180699724","wikidata":"https://www.wikidata.org/wiki/Q1877782","display_name":"Lustre (file system)","level":3,"score":0.5529000163078308},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.5378999710083008},{"id":"https://openalex.org/C152043487","wikidata":"https://www.wikidata.org/wiki/Q1229600","display_name":"Distributed File System","level":2,"score":0.46070000529289246},{"id":"https://openalex.org/C2225880","wikidata":"https://www.wikidata.org/wiki/Q579047","display_name":"Journaling file system","level":3,"score":0.43619999289512634},{"id":"https://openalex.org/C79158427","wikidata":"https://www.wikidata.org/wiki/Q485396","display_name":"Analytics","level":2,"score":0.4318000078201294},{"id":"https://openalex.org/C201743585","wikidata":"https://www.wikidata.org/wiki/Q1373925","display_name":"Flat file database","level":5,"score":0.3783999979496002},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.37400001287460327},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.3646000027656555},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.35440000891685486},{"id":"https://openalex.org/C13600138","wikidata":"https://www.wikidata.org/wiki/Q8799","display_name":"Petabyte","level":3,"score":0.35199999809265137},{"id":"https://openalex.org/C2779489174","wikidata":"https://www.wikidata.org/wiki/Q6822246","display_name":"Metadata management","level":3,"score":0.34779998660087585},{"id":"https://openalex.org/C95637964","wikidata":"https://www.wikidata.org/wiki/Q82753","display_name":"Computer file","level":2,"score":0.3472999930381775},{"id":"https://openalex.org/C88548561","wikidata":"https://www.wikidata.org/wiki/Q347599","display_name":"sort","level":2,"score":0.3264999985694885},{"id":"https://openalex.org/C82820731","wikidata":"https://www.wikidata.org/wiki/Q2640620","display_name":"Self-certifying File System","level":3,"score":0.32409998774528503},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.3151000142097473},{"id":"https://openalex.org/C70388272","wikidata":"https://www.wikidata.org/wiki/Q5968558","display_name":"IBM","level":2,"score":0.3109000027179718},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.30250000953674316},{"id":"https://openalex.org/C59276292","wikidata":"https://www.wikidata.org/wiki/Q580427","display_name":"Database index","level":3,"score":0.29739999771118164},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.29679998755455017},{"id":"https://openalex.org/C2212953","wikidata":"https://www.wikidata.org/wiki/Q948454","display_name":"Transaction log","level":3,"score":0.27300000190734863},{"id":"https://openalex.org/C70061542","wikidata":"https://www.wikidata.org/wiki/Q989016","display_name":"Distributed database","level":2,"score":0.2721000015735626},{"id":"https://openalex.org/C40350719","wikidata":"https://www.wikidata.org/wiki/Q2451637","display_name":"Torrent file","level":4,"score":0.25850000977516174},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.25049999356269836}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.10295","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10295","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.10295","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10295","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Modern":[0],"HPC":[1,170],"file":[2,24,67,82,137],"systems":[3,103],"can":[4],"contain":[5],"billions":[6,162],"of":[7,11,13,81,126,163],"files":[8],"and":[9,30,44,52,71,78,95,107,115,122,139,146,158,179,189],"hundreds":[10],"petabytes":[12],"data,":[14],"making":[15],"even":[16],"simple":[17],"questions":[18],"increasingly":[19],"intractable":[20],"to":[21,33,35],"answer.":[22],"Traditional":[23],"system":[25,68,83],"utilities":[26],"such":[27,104],"as":[28,105],"find":[29],"du":[31],"fail":[32],"scale":[34],"these":[36],"sizes.":[37],"While":[38],"external":[39],"indexing":[40,70,180],"tools":[41],"like":[42],"GUFI":[43],"Brindexer":[45],"improve":[46],"query":[47],"performance,":[48],"they":[49],"remain":[50],"batch-oriented":[51],"unsuitable":[53],"for":[54,65,91,98,153,185],"heterogeneous,":[55],"rapidly":[56],"evolving":[57],"environments.":[58],"We":[59],"present":[60],"Icicle,":[61],"a":[62,75],"scalable":[63,124],"framework":[64],"continuous":[66],"metadata":[69,93,127,190],"monitoring.":[72],"Icicle":[73,118],"maintains":[74],"unified,":[76],"up-to-date,":[77],"queryable":[79],"view":[80],"state":[84],"while":[85],"supporting":[86],"both":[87,135,154],"periodic":[88],"snapshot-based":[89],"ingestion":[90,97,125],"bulk":[92],"updates":[94],"event-based":[96],"real-time":[99],"synchronization":[100],"from":[101],"production":[102],"Lustre":[106],"IBM":[108],"Storage":[109],"Scale.":[110],"Built":[111],"on":[112,168],"Apache":[113,116],"Kafka":[114],"Flink,":[117],"provides":[119],"high-throughput,":[120],"fault-tolerant,":[121],"horizontally":[123],"events":[128],"into":[129],"two":[130],"complementary":[131],"search":[132],"indexes,":[133],"enabling":[134],"individual":[136],"discovery":[138],"aggregate":[140],"summary":[141],"statistics":[142],"by":[143],"user,":[144],"group,":[145],"directory.":[147],"This":[148],"architecture":[149],"enables":[150],"efficient":[151],"support":[152],"coarse-grained":[155],"administrative":[156],"queries":[157],"interactive":[159],"analytics":[160],"over":[161,176],"objects.":[164],"Our":[165],"experimental":[166],"evaluation":[167],"production-scale":[169],"datasets":[171],"demonstrates":[172],"order-of-magnitude":[173],"throughput":[174],"improvements":[175],"existing":[177],"monitoring":[178],"approaches,":[181],"with":[182],"tunable":[183],"options":[184],"balancing":[186],"consistency,":[187],"latency,":[188],"freshness.":[191]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-15T00:00:00"}
