{"id":"https://openalex.org/W2093763734","doi":"https://doi.org/10.1145/2699026.2699106","title":"Privacy-Preserving Scanning of Big Content for Sensitive Data Exposure with MapReduce","display_name":"Privacy-Preserving Scanning of Big Content for Sensitive Data Exposure with MapReduce","publication_year":2015,"publication_date":"2015-02-23","ids":{"openalex":"https://openalex.org/W2093763734","doi":"https://doi.org/10.1145/2699026.2699106","mag":"2093763734"},"language":"en","primary_location":{"id":"doi:10.1145/2699026.2699106","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2699026.2699106","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 5th ACM Conference on Data and Application Security and Privacy","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100453118","display_name":"Fang Liu","orcid":"https://orcid.org/0000-0003-2412-9768"},"institutions":[{"id":"https://openalex.org/I859038795","display_name":"Virginia Tech","ror":"https://ror.org/02smfhw86","country_code":"US","type":"education","lineage":["https://openalex.org/I859038795"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fang Liu","raw_affiliation_strings":["Virginia Tech, Blacksburg, VA, USA","Virginia Tech, , Blacksburg, VA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Virginia Tech, Blacksburg, VA, USA","institution_ids":["https://openalex.org/I859038795"]},{"raw_affiliation_string":"Virginia Tech, , Blacksburg, VA, USA","institution_ids":["https://openalex.org/I859038795"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046558241","display_name":"Xiaokui Shu","orcid":"https://orcid.org/0000-0002-7381-7041"},"institutions":[{"id":"https://openalex.org/I859038795","display_name":"Virginia Tech","ror":"https://ror.org/02smfhw86","country_code":"US","type":"education","lineage":["https://openalex.org/I859038795"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaokui Shu","raw_affiliation_strings":["Virginia Tech, Blacksburg, VA, USA","Virginia Tech, , Blacksburg, VA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Virginia Tech, Blacksburg, VA, USA","institution_ids":["https://openalex.org/I859038795"]},{"raw_affiliation_string":"Virginia Tech, , Blacksburg, VA, USA","institution_ids":["https://openalex.org/I859038795"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034366344","display_name":"Danfeng Yao","orcid":"https://orcid.org/0000-0001-8969-2792"},"institutions":[{"id":"https://openalex.org/I859038795","display_name":"Virginia Tech","ror":"https://ror.org/02smfhw86","country_code":"US","type":"education","lineage":["https://openalex.org/I859038795"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Danfeng Yao","raw_affiliation_strings":["Virginia Tech, Blacksburg, VA, USA","Virginia Tech, , Blacksburg, VA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Virginia Tech, Blacksburg, VA, USA","institution_ids":["https://openalex.org/I859038795"]},{"raw_affiliation_string":"Virginia Tech, , Blacksburg, VA, USA","institution_ids":["https://openalex.org/I859038795"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013454209","display_name":"Ali R. Butt","orcid":"https://orcid.org/0000-0002-0871-7263"},"institutions":[{"id":"https://openalex.org/I859038795","display_name":"Virginia Tech","ror":"https://ror.org/02smfhw86","country_code":"US","type":"education","lineage":["https://openalex.org/I859038795"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ali R. Butt","raw_affiliation_strings":["Virginia Tech, Blacksburg, VA, USA","Virginia Tech, , Blacksburg, VA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Virginia Tech, Blacksburg, VA, USA","institution_ids":["https://openalex.org/I859038795"]},{"raw_affiliation_string":"Virginia Tech, , Blacksburg, VA, USA","institution_ids":["https://openalex.org/I859038795"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":24.7371,"has_fulltext":false,"cited_by_count":57,"citation_normalized_percentile":{"value":0.99382847,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"195","last_page":"206"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11614","display_name":"Cloud Data Security Solutions","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11614","display_name":"Cloud Data Security Solutions","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12034","display_name":"Digital and Cyber Forensics","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10388","display_name":"Advanced Steganography and Watermarking Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8536024689674377},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7053558826446533},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.595942497253418},{"id":"https://openalex.org/keywords/outsourcing","display_name":"Outsourcing","score":0.5707101225852966},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.4889325201511383},{"id":"https://openalex.org/keywords/volume","display_name":"Volume (thermodynamics)","score":0.47256606817245483},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.4353603720664978},{"id":"https://openalex.org/keywords/information-privacy","display_name":"Information privacy","score":0.41956713795661926},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3636365234851837},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.35791414976119995},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.34009960293769836},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.30062007904052734},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.17485672235488892}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8536024689674377},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7053558826446533},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.595942497253418},{"id":"https://openalex.org/C46934059","wikidata":"https://www.wikidata.org/wiki/Q61515","display_name":"Outsourcing","level":2,"score":0.5707101225852966},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.4889325201511383},{"id":"https://openalex.org/C20556612","wikidata":"https://www.wikidata.org/wiki/Q4469374","display_name":"Volume (thermodynamics)","level":2,"score":0.47256606817245483},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.4353603720664978},{"id":"https://openalex.org/C123201435","wikidata":"https://www.wikidata.org/wiki/Q456632","display_name":"Information privacy","level":2,"score":0.41956713795661926},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3636365234851837},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.35791414976119995},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.34009960293769836},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.30062007904052734},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.17485672235488892},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1145/2699026.2699106","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2699026.2699106","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 5th ACM Conference on Data and Application Security and Privacy","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.705.1956","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.705.1956","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://people.cs.vt.edu/danfeng/papers/DLD-MapReduce-CODASPY-15.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.882.8085","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.882.8085","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"https://vtechworks.lib.vt.edu/bitstream/handle/10919/51271/hadoop-DLD.pdf%3Bjsessionid%3DED46DBF20325B57D72F1B3ACA5D8A329?sequence%3D4","raw_type":"text"},{"id":"pmh:oai:vtechworks.lib.vt.edu:10919/51271","is_oa":false,"landing_page_url":"http://hdl.handle.net/10919/51271","pdf_url":null,"source":{"id":"https://openalex.org/S4306400248","display_name":"VTechWorks (Virginia Tech)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I859038795","host_organization_name":"Virginia Tech","host_organization_lineage":["https://openalex.org/I859038795"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W66333431","https://openalex.org/W139488912","https://openalex.org/W192814132","https://openalex.org/W196977431","https://openalex.org/W205715760","https://openalex.org/W1451710050","https://openalex.org/W1491237615","https://openalex.org/W1590597681","https://openalex.org/W1593657937","https://openalex.org/W1969838337","https://openalex.org/W1970567146","https://openalex.org/W1986824012","https://openalex.org/W1987650093","https://openalex.org/W1990089904","https://openalex.org/W2020820745","https://openalex.org/W2022458254","https://openalex.org/W2032389920","https://openalex.org/W2040722314","https://openalex.org/W2043099794","https://openalex.org/W2061445336","https://openalex.org/W2077699053","https://openalex.org/W2086185540","https://openalex.org/W2088826400","https://openalex.org/W2107461003","https://openalex.org/W2114996745","https://openalex.org/W2116762767","https://openalex.org/W2119028650","https://openalex.org/W2125816831","https://openalex.org/W2127757034","https://openalex.org/W2131229759","https://openalex.org/W2131772137","https://openalex.org/W2132399973","https://openalex.org/W2137139422","https://openalex.org/W2139605600","https://openalex.org/W2143087446","https://openalex.org/W2148885851","https://openalex.org/W2150115633","https://openalex.org/W2151930506","https://openalex.org/W2163738013","https://openalex.org/W2173213060","https://openalex.org/W2215904967","https://openalex.org/W2350778671","https://openalex.org/W2545374358","https://openalex.org/W2913264117","https://openalex.org/W4255673994"],"related_works":["https://openalex.org/W2358200898","https://openalex.org/W2325765407","https://openalex.org/W618293728","https://openalex.org/W2291845669","https://openalex.org/W2788012436","https://openalex.org/W200604156","https://openalex.org/W4231184955","https://openalex.org/W2374784346","https://openalex.org/W4286615217","https://openalex.org/W3154723744"],"abstract_inverted_index":{"The":[0],"exposure":[1,128],"of":[2,34,129,141],"sensitive":[3,31,62,130],"data":[4,39,93,117,131,143],"in":[5],"storage":[6,26],"and":[7,15,38,72,149],"transmission":[8],"poses":[9],"a":[10,42,50,114],"serious":[11],"threat":[12],"to":[13,46,69,125,146],"organizational":[14],"personal":[16],"security.":[17],"Data":[18],"leak":[19,94,144],"detection":[20,145],"aims":[21],"at":[22],"scanning":[23],"content":[24,37],"(in":[25],"or":[27],"transmission)":[28],"for":[29,49,59,76,88,92],"exposed":[30,61],"data.":[32],"Because":[33],"the":[35,56,67,77,100,122,127,133,138,142],"large":[36],"volume,":[40],"such":[41,79],"screening":[43],"algorithm":[44],"needs":[45],"be":[47],"scalable":[48],"timely":[51],"detection.":[52,95,134],"Our":[53,96,111],"solution":[54],"uses":[55],"MapReduce":[57,86,148],"framework":[58],"detecting":[60],"content,":[63],"because":[64],"it":[65],"has":[66],"ability":[68],"arbitrarily":[70],"scale":[71],"utilize":[73],"public":[74],"resources":[75],"task,":[78],"as":[80],"Amazon":[81],"EC2.":[82],"We":[83],"design":[84],"new":[85],"algorithms":[87,112],"computing":[89],"collection":[90],"intersection":[91],"prototype":[97],"implemented":[98],"with":[99,108],"Hadoop":[101],"system":[102],"achieves":[103],"225":[104],"Mbps":[105],"analysis":[106],"throughput":[107],"24":[109],"nodes.":[110],"support":[113],"useful":[115],"privacy-preserving":[116,123],"transformation.":[118],"This":[119,135],"transformation":[120,136],"enables":[121],"technique":[124],"minimize":[126],"during":[132],"supports":[137],"secure":[139],"outsourcing":[140],"untrusted":[147],"cloud":[150],"providers.":[151]},"counts_by_year":[{"year":2024,"cited_by_count":3},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":10},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":6},{"year":2017,"cited_by_count":11},{"year":2016,"cited_by_count":9},{"year":2015,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
