{"id":"https://openalex.org/W4385270442","doi":"https://doi.org/10.1109/icde55515.2023.00009","title":"HyperCalm Sketch: One-Pass Mining Periodic Batches in Data Streams","display_name":"HyperCalm Sketch: One-Pass Mining Periodic Batches in Data Streams","publication_year":2023,"publication_date":"2023-04-01","ids":{"openalex":"https://openalex.org/W4385270442","doi":"https://doi.org/10.1109/icde55515.2023.00009"},"language":"en","primary_location":{"id":"doi:10.1109/icde55515.2023.00009","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icde55515.2023.00009","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 39th International Conference on Data Engineering (ICDE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101916543","display_name":"Zirui Liu","orcid":"https://orcid.org/0000-0001-9062-6565"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zirui Liu","raw_affiliation_strings":["Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067395122","display_name":"Chaozhe Kong","orcid":"https://orcid.org/0000-0001-8232-8680"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chaozhe Kong","raw_affiliation_strings":["Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061907296","display_name":"Kai-Cheng Yang","orcid":"https://orcid.org/0000-0001-6381-4026"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaicheng Yang","raw_affiliation_strings":["Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069277955","display_name":"Tong Yang","orcid":"https://orcid.org/0000-0003-2402-5854"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tong Yang","raw_affiliation_strings":["Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","Peng Cheng Laboratory, Shenzhen, China","School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]},{"raw_affiliation_string":"School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026587300","display_name":"Ruijie Miao","orcid":"https://orcid.org/0000-0002-7266-8064"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruijie Miao","raw_affiliation_strings":["Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102973444","display_name":"Qizhi Chen","orcid":"https://orcid.org/0009-0004-4020-6772"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qizhi Chen","raw_affiliation_strings":["Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048093695","display_name":"Yikai Zhao","orcid":"https://orcid.org/0000-0003-2495-7774"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yikai Zhao","raw_affiliation_strings":["Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034300662","display_name":"Yaofeng Tu","orcid":"https://orcid.org/0000-0002-2616-2273"},"institutions":[{"id":"https://openalex.org/I75746372","display_name":"ZTE (United States)","ror":"https://ror.org/0518yg160","country_code":"US","type":"company","lineage":["https://openalex.org/I4210098582","https://openalex.org/I75746372"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yaofeng Tu","raw_affiliation_strings":["ZTE Corporation"],"affiliations":[{"raw_affiliation_string":"ZTE Corporation","institution_ids":["https://openalex.org/I75746372"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062357883","display_name":"Bin Cui","orcid":"https://orcid.org/0000-0003-1681-4677"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Cui","raw_affiliation_strings":["Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application,Beijing,China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Computer Science, and National Engineering Laboratory for Big Data Analysis Technology and Application, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5101916543"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":2.8128,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.91072873,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"14","last_page":"26"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.8413470983505249},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7665113210678101},{"id":"https://openalex.org/keywords/bloom-filter","display_name":"Bloom filter","score":0.7232968807220459},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.5538896322250366},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.4690188765525818},{"id":"https://openalex.org/keywords/value","display_name":"Value (mathematics)","score":0.4459201693534851},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.44315534830093384},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4186367988586426},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.40679800510406494},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.2457188367843628},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.10162040591239929}],"concepts":[{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.8413470983505249},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7665113210678101},{"id":"https://openalex.org/C147224247","wikidata":"https://www.wikidata.org/wiki/Q885373","display_name":"Bloom filter","level":2,"score":0.7232968807220459},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.5538896322250366},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.4690188765525818},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.4459201693534851},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.44315534830093384},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4186367988586426},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.40679800510406494},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.2457188367843628},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.10162040591239929},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icde55515.2023.00009","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icde55515.2023.00009","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 39th International Conference on Data Engineering (ICDE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.4099999964237213,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320337504","display_name":"Research and Development","ror":"https://ror.org/027s68j25"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W206179863","https://openalex.org/W1675727887","https://openalex.org/W2012549717","https://openalex.org/W2044023374","https://openalex.org/W2080234606","https://openalex.org/W2123845384","https://openalex.org/W2124897521","https://openalex.org/W2126884435","https://openalex.org/W2143198762","https://openalex.org/W2152706145","https://openalex.org/W2155095613","https://openalex.org/W2389126562","https://openalex.org/W2439904216","https://openalex.org/W2517662914","https://openalex.org/W2566979091","https://openalex.org/W2767867000","https://openalex.org/W2798870428","https://openalex.org/W2798945787","https://openalex.org/W2809244162","https://openalex.org/W2916816487","https://openalex.org/W2944916577","https://openalex.org/W2962979766","https://openalex.org/W2963458398","https://openalex.org/W2963898466","https://openalex.org/W2965206958","https://openalex.org/W2979352525","https://openalex.org/W3007098654","https://openalex.org/W3011389351","https://openalex.org/W3013442081","https://openalex.org/W3080109618","https://openalex.org/W3106272338","https://openalex.org/W3169567991","https://openalex.org/W3170032932","https://openalex.org/W3170078628","https://openalex.org/W3173768992","https://openalex.org/W3174641525","https://openalex.org/W3176186668","https://openalex.org/W3176348316","https://openalex.org/W3177067869","https://openalex.org/W4249843299","https://openalex.org/W4254155307","https://openalex.org/W4289533821","https://openalex.org/W4289533971","https://openalex.org/W4385270464","https://openalex.org/W6608493259","https://openalex.org/W6682883714","https://openalex.org/W6726523432","https://openalex.org/W6731596640","https://openalex.org/W6769284620"],"related_works":["https://openalex.org/W2086572746","https://openalex.org/W2604468458","https://openalex.org/W2157216338","https://openalex.org/W121740227","https://openalex.org/W1662107788","https://openalex.org/W2378994405","https://openalex.org/W3082379938","https://openalex.org/W2135966669","https://openalex.org/W2385974820","https://openalex.org/W2594143027"],"abstract_inverted_index":{"Batch":[0],"is":[1,65],"an":[2,123],"important":[3,66],"pattern":[4],"in":[5,67,97,155,163],"data":[6],"streams,":[7],"which":[8,89],"refers":[9,49],"to":[10,50,93,112,131,171],"a":[11,38,81,105,172],"group":[12,45],"of":[13,29,46,53,116,157,165],"identical":[14],"items":[15],"that":[16,21,25],"arrive":[17,26,60],"closely.":[18],"We":[19,79,136,167],"find":[20],"some":[22],"special":[23],"batches":[24,48,52,59,64,96],"periodically":[27],"are":[28,184],"great":[30],"value.":[31],"In":[32,100,118],"this":[33],"paper,":[34],"we":[35,103,121],"formally":[36],"define":[37],"new":[39],"pattern,":[40],"namely":[41,85,109],"periodic":[42,47,63,95,134],"batches.":[43,117,135],"A":[44],"several":[51],"the":[54,86,114,139,151],"same":[55],"item,":[56],"where":[57],"these":[58],"periodically.":[61],"Studying":[62],"many":[68],"applications,":[69],"such":[70],"as":[71],"caches,":[72],"financial":[73],"markets,":[74],"online":[75],"advertisements,":[76],"networks,":[77],"etc.":[78],"propose":[80,104,122],"one-pass":[82],"sketching":[83],"algorithm,":[84,126],"HyperCalm":[87,149,170,177],"sketch,":[88],"takes":[90],"two":[91],"phases":[92],"detect":[94,113],"real":[98],"time.":[99],"phase":[101,119],"1,":[102],"time-aware":[106],"Bloom":[107],"filter,":[108],"HyperBloomFilter":[110],"(HyperBF),":[111],"start":[115],"2,":[120],"enhanced":[124],"top-k":[125,133],"called":[127],"Calm":[128],"Space-Saving":[129],"(CalmSS),":[130],"report":[132],"theoretically":[137],"derive":[138],"error":[140,160],"bounds":[141],"for":[142],"HyperBF":[143],"and":[144,161,175],"CalmSS.":[145],"Extensive":[146],"experiments":[147],"show":[148],"outperforms":[150],"strawman":[152],"solutions":[153],"4\u00d7":[154],"term":[156,164],"average":[158],"relative":[159],"13.2\u00d7":[162],"speed.":[166],"also":[168],"apply":[169],"cache":[173],"system":[174],"integrate":[176],"into":[178],"Apache":[179],"Flink.":[180],"All":[181],"related":[182],"codes":[183],"open-sourced.":[185]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
