{"id":"https://openalex.org/W7134986595","doi":"https://doi.org/10.48550/arxiv.2603.09166","title":"Fast and Optimal Differentially Private Frequent-Substring Mining","display_name":"Fast and Optimal Differentially Private Frequent-Substring Mining","publication_year":2026,"publication_date":"2026-03-10","ids":{"openalex":"https://openalex.org/W7134986595","doi":"https://doi.org/10.48550/arxiv.2603.09166"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.09166","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09166","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.09166","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128764730","display_name":"Peaker Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Peaker","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128742684","display_name":"Rayne Holland","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Holland, Rayne","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128714551","display_name":"Hao Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Hao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.8288999795913696,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.8288999795913696,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10237","display_name":"Cryptography and Data Security","score":0.0803999975323677,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.010700000450015068,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/substring","display_name":"Substring","score":0.8902000188827515},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.6722999811172485},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5324000120162964},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5016999840736389},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4203999936580658},{"id":"https://openalex.org/keywords/quadratic-equation","display_name":"Quadratic equation","score":0.39820000529289246},{"id":"https://openalex.org/keywords/subroutine","display_name":"Subroutine","score":0.3675000071525574},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.36559998989105225}],"concepts":[{"id":"https://openalex.org/C182407805","wikidata":"https://www.wikidata.org/wiki/Q2626534","display_name":"Substring","level":3,"score":0.8902000188827515},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.6722999811172485},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6281999945640564},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5324000120162964},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5016999840736389},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4537000060081482},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4203999936580658},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4050000011920929},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.39820000529289246},{"id":"https://openalex.org/C96147967","wikidata":"https://www.wikidata.org/wiki/Q190686","display_name":"Subroutine","level":2,"score":0.3675000071525574},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.36559998989105225},{"id":"https://openalex.org/C190290938","wikidata":"https://www.wikidata.org/wiki/Q387015","display_name":"Trie","level":3,"score":0.3626999855041504},{"id":"https://openalex.org/C311688","wikidata":"https://www.wikidata.org/wiki/Q2393193","display_name":"Time complexity","level":2,"score":0.33550000190734863},{"id":"https://openalex.org/C93226319","wikidata":"https://www.wikidata.org/wiki/Q193137","display_name":"Differential (mechanical device)","level":2,"score":0.328000009059906},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.32330000400543213},{"id":"https://openalex.org/C23130292","wikidata":"https://www.wikidata.org/wiki/Q5275358","display_name":"Differential privacy","level":2,"score":0.31299999356269836},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.30869999527931213},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.27889999747276306},{"id":"https://openalex.org/C42747912","wikidata":"https://www.wikidata.org/wiki/Q1048447","display_name":"Multiplicative function","level":2,"score":0.2770000100135803},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2648000121116638},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.2612000107765198},{"id":"https://openalex.org/C112876837","wikidata":"https://www.wikidata.org/wiki/Q837518","display_name":"Alphabet","level":2,"score":0.251800000667572},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.2515000104904175}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.09166","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09166","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.09166","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09166","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Given":[0],"a":[1,13,36,59,98,110],"dataset":[2],"of":[3,8,48,101,119,127],"$n$":[4],"user-contributed":[5],"strings,":[6],"each":[7,25],"length":[9],"at":[10,44],"most":[11],"$\\ell$,":[12],"key":[14],"problem":[15],"is":[16],"how":[17],"to":[18,75,83],"identify":[19],"all":[20],"frequent":[21,120,147],"substrings":[22,103],"while":[23,71],"preserving":[24],"user's":[26],"privacy.":[27,152],"Recent":[28],"work":[29],"by":[30,132],"Bernardini":[31],"et":[32],"al.":[33],"(PODS'25)":[34],"introduced":[35],"$\\varepsilon$-differentially":[37,61],"private":[38,62],"algorithm":[39,63],"achieving":[40],"near-optimal":[41,68],"error,":[42],"but":[43,104],"the":[45,66,116,128,138],"prohibitive":[46],"cost":[47],"$O(n^2\\ell^4)$":[49],"space":[50,73,130],"and":[51,80,122,124],"processing":[52],"time.":[53],"In":[54],"this":[55],"work,":[56,144],"we":[57],"present":[58],"new":[60,107],"that":[64,114],"retains":[65],"same":[67],"error":[69],"guarantees":[70],"reducing":[72],"complexity":[74,82],"$O(n":[76,84],"\\ell+":[77],"|\u03a3|":[78,86,88],")$":[79],"time":[81],"\\ell\\log":[85],"+":[87],")$,":[89],"for":[90],"input":[91],"alphabet":[92],"$\u03a3$.":[93],"Our":[94],"approach":[95],"builds":[96],"on":[97],"top-down":[99],"exploration":[100],"candidate":[102],"introduces":[105],"two":[106],"innovations:":[108],"(i)":[109],"refined":[111],"candidate-generation":[112],"strategy":[113],"leverages":[115],"structural":[117],"properties":[118],"prefixes":[121],"suffixes,":[123],"(ii)":[125],"pruning":[126],"search":[129],"guided":[131],"frequency":[133],"relations.":[134],"These":[135],"techniques":[136],"eliminate":[137],"quadratic":[139],"blow-ups":[140],"inherent":[141],"in":[142],"prior":[143],"enabling":[145],"scalable":[146],"substring":[148],"mining":[149],"under":[150],"differential":[151]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-12T00:00:00"}
