{"id":"https://openalex.org/W4223892082","doi":"https://doi.org/10.1007/s41060-022-00320-5","title":"Accurate and efficient privacy-preserving string matching","display_name":"Accurate and efficient privacy-preserving string matching","publication_year":2022,"publication_date":"2022-04-13","ids":{"openalex":"https://openalex.org/W4223892082","doi":"https://doi.org/10.1007/s41060-022-00320-5"},"language":"en","primary_location":{"id":"doi:10.1007/s41060-022-00320-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s41060-022-00320-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s41060-022-00320-5.pdf","source":{"id":"https://openalex.org/S4210195017","display_name":"International Journal of Data Science and Analytics","issn_l":"2364-415X","issn":["2364-415X","2364-4168"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319972","host_organization_name":"Springer International Publishing","host_organization_lineage":["https://openalex.org/P4310319972","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer International Publishing","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Data Science and Analytics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s41060-022-00320-5.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048648969","display_name":"Sirintra Vaiwsri","orcid":"https://orcid.org/0000-0002-1391-6160"},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Sirintra Vaiwsri","raw_affiliation_strings":["School of Computing, The Australian, National University, Canberra, ACT, 2600, Australia"],"raw_orcid":"https://orcid.org/0000-0002-1391-6160","affiliations":[{"raw_affiliation_string":"School of Computing, The Australian, National University, Canberra, ACT, 2600, Australia","institution_ids":["https://openalex.org/I118347636"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038468449","display_name":"Thilina Ranbaduge","orcid":"https://orcid.org/0000-0001-5405-3704"},"institutions":[{"id":"https://openalex.org/I42894916","display_name":"Data61","ror":"https://ror.org/03q397159","country_code":"AU","type":"other","lineage":["https://openalex.org/I1292875679","https://openalex.org/I2801453606","https://openalex.org/I42894916","https://openalex.org/I4387156119"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Thilina Ranbaduge","raw_affiliation_strings":["Data61, Black Mountain, Canberra, ACT, 2600, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Data61, Black Mountain, Canberra, ACT, 2600, Australia","institution_ids":["https://openalex.org/I42894916"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022945960","display_name":"Peter Christen","orcid":"https://orcid.org/0000-0003-3435-2015"},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Peter Christen","raw_affiliation_strings":["School of Computing, The Australian, National University, Canberra, ACT, 2600, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computing, The Australian, National University, Canberra, ACT, 2600, Australia","institution_ids":["https://openalex.org/I118347636"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5048648969"],"corresponding_institution_ids":["https://openalex.org/I118347636"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":1.2486,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.82554443,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"14","issue":"2","first_page":"191","last_page":"215"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10237","display_name":"Cryptography and Data Security","score":0.9786999821662903,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/string-searching-algorithm","display_name":"String searching algorithm","score":0.705010712146759},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7048617005348206},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.6819621920585632},{"id":"https://openalex.org/keywords/approximate-string-matching","display_name":"Approximate string matching","score":0.6427897214889526},{"id":"https://openalex.org/keywords/string-metric","display_name":"String metric","score":0.6400313973426819},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5478149056434631},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5454859733581543},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.476727157831192},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4575135111808777},{"id":"https://openalex.org/keywords/edit-distance","display_name":"Edit distance","score":0.4481014907360077},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4026668965816498},{"id":"https://openalex.org/keywords/pattern-matching","display_name":"Pattern matching","score":0.30869901180267334},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.262008398771286},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.23976022005081177},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1808854639530182}],"concepts":[{"id":"https://openalex.org/C7757238","wikidata":"https://www.wikidata.org/wiki/Q374040","display_name":"String searching algorithm","level":3,"score":0.705010712146759},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7048617005348206},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.6819621920585632},{"id":"https://openalex.org/C32610155","wikidata":"https://www.wikidata.org/wiki/Q1798621","display_name":"Approximate string matching","level":3,"score":0.6427897214889526},{"id":"https://openalex.org/C22820288","wikidata":"https://www.wikidata.org/wiki/Q9050568","display_name":"String metric","level":4,"score":0.6400313973426819},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5478149056434631},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5454859733581543},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.476727157831192},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4575135111808777},{"id":"https://openalex.org/C44359876","wikidata":"https://www.wikidata.org/wiki/Q5338467","display_name":"Edit distance","level":2,"score":0.4481014907360077},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4026668965816498},{"id":"https://openalex.org/C68859911","wikidata":"https://www.wikidata.org/wiki/Q1503724","display_name":"Pattern matching","level":2,"score":0.30869901180267334},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.262008398771286},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.23976022005081177},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1808854639530182},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s41060-022-00320-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s41060-022-00320-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s41060-022-00320-5.pdf","source":{"id":"https://openalex.org/S4210195017","display_name":"International Journal of Data Science and Analytics","issn_l":"2364-415X","issn":["2364-415X","2364-4168"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319972","host_organization_name":"Springer International Publishing","host_organization_lineage":["https://openalex.org/P4310319972","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer International Publishing","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Data Science and Analytics","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s41060-022-00320-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s41060-022-00320-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s41060-022-00320-5.pdf","source":{"id":"https://openalex.org/S4210195017","display_name":"International Journal of Data Science and Analytics","issn_l":"2364-415X","issn":["2364-415X","2364-4168"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319972","host_organization_name":"Springer International Publishing","host_organization_lineage":["https://openalex.org/P4310319972","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer International Publishing","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Data Science and Analytics","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.800000011920929,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G4901731796","display_name":null,"funder_award_id":"DP160101934","funder_id":"https://openalex.org/F4320334704","funder_display_name":"Australian Research Council"}],"funders":[{"id":"https://openalex.org/F4320334704","display_name":"Australian Research Council","ror":"https://ror.org/05mmh0f86"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4223892082.pdf","grobid_xml":"https://content.openalex.org/works/W4223892082.grobid-xml"},"referenced_works_count":53,"referenced_works":["https://openalex.org/W293439698","https://openalex.org/W1585665690","https://openalex.org/W1586468107","https://openalex.org/W1604639942","https://openalex.org/W1819119697","https://openalex.org/W1834151548","https://openalex.org/W1977056427","https://openalex.org/W1987562803","https://openalex.org/W1995875735","https://openalex.org/W2004957971","https://openalex.org/W2029128277","https://openalex.org/W2029948740","https://openalex.org/W2041936211","https://openalex.org/W2080389711","https://openalex.org/W2086751352","https://openalex.org/W2091014722","https://openalex.org/W2092071682","https://openalex.org/W2108834246","https://openalex.org/W2116025923","https://openalex.org/W2121252285","https://openalex.org/W2132069633","https://openalex.org/W2141965543","https://openalex.org/W2150926065","https://openalex.org/W2199404809","https://openalex.org/W2289049650","https://openalex.org/W2323506184","https://openalex.org/W2473182694","https://openalex.org/W2577090845","https://openalex.org/W2589250137","https://openalex.org/W2604123379","https://openalex.org/W2606710373","https://openalex.org/W2762887147","https://openalex.org/W2790563985","https://openalex.org/W2798841271","https://openalex.org/W2802266710","https://openalex.org/W2808633588","https://openalex.org/W2899702797","https://openalex.org/W2911978475","https://openalex.org/W2921249631","https://openalex.org/W2949524341","https://openalex.org/W3014048501","https://openalex.org/W3042518069","https://openalex.org/W3110895214","https://openalex.org/W3138898752","https://openalex.org/W3157379050","https://openalex.org/W3160027900","https://openalex.org/W3194621686","https://openalex.org/W4206009022","https://openalex.org/W4210754024","https://openalex.org/W4225249012","https://openalex.org/W4240908132","https://openalex.org/W4242373515","https://openalex.org/W4242744113"],"related_works":["https://openalex.org/W2399644331","https://openalex.org/W2405436873","https://openalex.org/W52396946","https://openalex.org/W1982055477","https://openalex.org/W2061135126","https://openalex.org/W4248804345","https://openalex.org/W1492858093","https://openalex.org/W2599240737","https://openalex.org/W2595827536","https://openalex.org/W1998140328"],"abstract_inverted_index":{"Abstract":[0],"The":[1,68],"task":[2],"of":[3,45,52,86,95,126,182,203],"calculating":[4],"similarities":[5],"between":[6],"strings":[7,15,82,105],"held":[8],"by":[9],"different":[10,104,201],"organisations":[11],"without":[12],"revealing":[13],"these":[14],"is":[16],"an":[17],"increasingly":[18],"important":[19],"problem":[20],"in":[21,83,171],"areas":[22],"such":[23],"as":[24,110],"health":[25],"informatics,":[26],"national":[27],"censuses,":[28],"genomics,":[29],"and":[30,80,144,205,210],"fraud":[31],"detection.":[32],"Most":[33],"existing":[34,119],"privacy-preserving":[35,70,87,146],"string":[36,147,184],"matching":[37,51,148],"approaches":[38,141,195],"are":[39,57,74],"either":[40],"based":[41],"on":[42,163,196],"comparing":[43],"sets":[44,199],"encoded":[46,53],"characters":[47],"allowing":[48],"only":[49],"exact":[50],"strings,":[54,169,204],"or":[55],"they":[56,219],"aimed":[58],"at":[59],"long":[60],"genomics":[61],"sequences":[62],"that":[63,73,149,218],"have":[64],"a":[65,100,111,183],"small":[66],"alphabet.":[67],"set-based":[69,120],"similarity":[71],"functions":[72],"commonly":[75],"used":[76],"to":[77,114,166,185,213],"compare":[78,167],"name":[79],"address":[81],"the":[84,93,124,127,156,172,180,187],"context":[85],"record":[88],"linkage":[89],"do":[90],"not":[91],"take":[92],"positions":[94],"sub-strings":[96,164,181],"into":[97],"account.":[98],"As":[99],"result,":[101],"two":[102,132,139],"very":[103],"can":[106],"potentially":[107],"be":[108],"considered":[109],"match":[112],"leading":[113],"wrongly":[115],"linked":[116],"records.":[117],"Furthermore,":[118],"techniques":[121],"cannot":[122],"identify":[123,186],"length":[125],"longest":[128,188],"common":[129,189],"sub-string":[130],"across":[131],"strings.":[133],"In":[134,155],"this":[135],"paper,":[136],"we":[137,159,175],"propose":[138],"new":[140],"for":[142],"accurate":[143],"efficient":[145],"provide":[150],"privacy":[151],"against":[152],"various":[153],"attacks.":[154],"first":[157],"approach":[158,174],"apply":[160],"hashing-based":[161],"encoding":[162],"(q-grams)":[165],"sensitive":[168],"while":[170],"second":[173],"generate":[176],"one-bit":[177],"array":[178],"from":[179],"bit":[190],"sequences.":[191],"We":[192],"evaluate":[193],"our":[194],"several":[197],"data":[198],"with":[200],"types":[202],"validate":[206],"their":[207],"privacy,":[208],"accuracy,":[209],"complexity":[211],"compared":[212],"three":[214],"baseline":[215],"techniques,":[216],"showing":[217],"outperform":[220],"all":[221],"baselines.":[222]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
