{"id":"https://openalex.org/W2616732338","doi":"https://doi.org/10.1109/icde.2017.50","title":"SF-sketch: A Fast, Accurate, and Memory Efficient Data Structure to Store Frequencies of Data Items","display_name":"SF-sketch: A Fast, Accurate, and Memory Efficient Data Structure to Store Frequencies of Data Items","publication_year":2017,"publication_date":"2017-04-01","ids":{"openalex":"https://openalex.org/W2616732338","doi":"https://doi.org/10.1109/icde.2017.50","mag":"2616732338"},"language":"en","primary_location":{"id":"doi:10.1109/icde.2017.50","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icde.2017.50","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE 33rd International Conference on Data Engineering (ICDE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069277955","display_name":"Tong Yang","orcid":"https://orcid.org/0000-0003-2402-5854"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Tong Yang","raw_affiliation_strings":["Collaborative Innovation Center of High Performance Computing, NUDT, Chanzsha, China","Peking University, China"],"affiliations":[{"raw_affiliation_string":"Collaborative Innovation Center of High Performance Computing, NUDT, Chanzsha, China","institution_ids":[]},{"raw_affiliation_string":"Peking University, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103240439","display_name":"Lingtong Liu","orcid":"https://orcid.org/0000-0001-8178-6030"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lingtong Liu","raw_affiliation_strings":["Xidian University, China"],"affiliations":[{"raw_affiliation_string":"Xidian University, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035494207","display_name":"Yibo Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yibo Yan","raw_affiliation_strings":["Peking University, China"],"affiliations":[{"raw_affiliation_string":"Peking University, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049422969","display_name":"Muhammad Shahzad","orcid":"https://orcid.org/0000-0003-4342-7875"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Muhammad Shahzad","raw_affiliation_strings":["North Carolina State University, USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043356063","display_name":"Yulong Shen","orcid":"https://orcid.org/0000-0002-8448-705X"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yulong Shen","raw_affiliation_strings":["Xidian University, China"],"affiliations":[{"raw_affiliation_string":"Xidian University, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100452115","display_name":"Xiaoming Li","orcid":"https://orcid.org/0000-0001-7122-3779"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoming Li","raw_affiliation_strings":["Peking University, China"],"affiliations":[{"raw_affiliation_string":"Peking University, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062357883","display_name":"Bin Cui","orcid":"https://orcid.org/0000-0003-1681-4677"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Cui","raw_affiliation_strings":["Peking University, China"],"affiliations":[{"raw_affiliation_string":"Peking University, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030689390","display_name":"Gaogang Xie","orcid":"https://orcid.org/0000-0003-4964-1135"},"institutions":[{"id":"https://openalex.org/I4210101410","display_name":"International Centre for Theoretical Physics Asia-Pacific","ror":"https://ror.org/01z2px678","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210101410","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gaogang Xie","raw_affiliation_strings":["ICT, China"],"affiliations":[{"raw_affiliation_string":"ICT, China","institution_ids":["https://openalex.org/I4210101410"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5069277955"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":4.1261,"has_fulltext":false,"cited_by_count":31,"citation_normalized_percentile":{"value":0.94682895,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"103","last_page":"106"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.9802271127700806},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8189126253128052},{"id":"https://openalex.org/keywords/memory-footprint","display_name":"Memory footprint","score":0.6485735177993774},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.6260169744491577},{"id":"https://openalex.org/keywords/footprint","display_name":"Footprint","score":0.5294610857963562},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4944324493408203},{"id":"https://openalex.org/keywords/sketch-recognition","display_name":"Sketch recognition","score":0.4861395061016083},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.4574948251247406},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.4375465512275696},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.41644641757011414},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.39788541197776794},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.390170156955719},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36351823806762695},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.20670494437217712},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.15488478541374207}],"concepts":[{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.9802271127700806},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8189126253128052},{"id":"https://openalex.org/C74912251","wikidata":"https://www.wikidata.org/wiki/Q6815727","display_name":"Memory footprint","level":2,"score":0.6485735177993774},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.6260169744491577},{"id":"https://openalex.org/C132943942","wikidata":"https://www.wikidata.org/wiki/Q2562511","display_name":"Footprint","level":2,"score":0.5294610857963562},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4944324493408203},{"id":"https://openalex.org/C132900626","wikidata":"https://www.wikidata.org/wiki/Q7534733","display_name":"Sketch recognition","level":4,"score":0.4861395061016083},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.4574948251247406},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.4375465512275696},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.41644641757011414},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.39788541197776794},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.390170156955719},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36351823806762695},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.20670494437217712},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.15488478541374207},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C207347870","wikidata":"https://www.wikidata.org/wiki/Q371174","display_name":"Gesture","level":2,"score":0.0},{"id":"https://openalex.org/C159437735","wikidata":"https://www.wikidata.org/wiki/Q1519524","display_name":"Gesture recognition","level":3,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icde.2017.50","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icde.2017.50","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE 33rd International Conference on Data Engineering (ICDE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6100000143051147,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1493892051","https://openalex.org/W1562125942","https://openalex.org/W1974466705","https://openalex.org/W1985229168","https://openalex.org/W2080222256","https://openalex.org/W2080234606","https://openalex.org/W2104100926","https://openalex.org/W2107443258","https://openalex.org/W2142269587","https://openalex.org/W2142808699","https://openalex.org/W2199464493","https://openalex.org/W2588188671","https://openalex.org/W4205471522","https://openalex.org/W4206137901","https://openalex.org/W4249843299","https://openalex.org/W4254091566","https://openalex.org/W6629496199","https://openalex.org/W6676268515"],"related_works":["https://openalex.org/W2294900353","https://openalex.org/W2411243951","https://openalex.org/W2151314278","https://openalex.org/W1971224820","https://openalex.org/W13629514","https://openalex.org/W2963977451","https://openalex.org/W2098836165","https://openalex.org/W1976890290","https://openalex.org/W1573697454","https://openalex.org/W2966897482"],"abstract_inverted_index":{"A":[0],"sketch":[1,78,84],"is":[2,8,70,96,142],"a":[3,16,23,44,53,76,82],"probabilistic":[4],"data":[5,29,36],"structure":[6],"that":[7,126],"used":[9,97,133],"to":[10,71,98],"record":[11],"frequencies":[12],"of":[13,25,137],"items":[14],"in":[15,22,135],"multi-set.":[17],"Sketches":[18],"have":[19],"been":[20],"applied":[21],"variety":[24],"fields,":[26],"such":[27],"as":[28],"stream":[30],"processing,":[31,34],"natural":[32],"language":[33],"distributed":[35],"sets":[37],"etc.":[38],"In":[39],"this":[40],"paper,":[41],"we":[42],"propose":[43],"new":[45],"sketch,":[46,50],"called":[47,79,85],"Slim-Fat":[48],"(SF)":[49],"which":[51],"has":[52],"much":[54],"smaller":[55],"memory":[56],"footprint":[57],"for":[58],"query":[59],"while":[60],"supporting":[61],"updates.":[62],"The":[63,87,94,139],"key":[64],"idea":[65],"behind":[66],"our":[67],"proposed":[68],"SF-sketch":[69,110,127],"maintain":[72],"two":[73],"separate":[74],"sketches:":[75],"small":[77],"Slimsubsketch":[80,88],"and":[81,91,102,108,116],"large":[83],"Fat-subsketch.":[86],"enables":[89],"fast":[90],"accurate":[92],"querying.":[93],"Fat-subsketch":[95],"assist":[99],"the":[100,130],"insertion":[101],"deletion":[103],"from":[104],"Slim-subsketch.":[105],"We":[106],"implemented":[107],"evaluated":[109],"along":[111],"with":[112],"several":[113],"prior":[114],"sketches":[115],"compared":[117],"them":[118],"side":[119],"by":[120],"side.":[121],"Our":[122],"experimental":[123],"results":[124],"show":[125],"significantly":[128],"outperforms":[129],"most":[131],"commonly":[132],"CM-sketch":[134],"terms":[136],"accuracy.":[138],"full":[140],"version":[141],"provided":[143],"at":[144],"arXiv.org":[145],"[12].":[146]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":7},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":5},{"year":2017,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
