{"id":"https://openalex.org/W1724849505","doi":"https://doi.org/10.1007/978-3-319-11257-2_20","title":"A Comparison of Blocking Methods for Record Linkage","display_name":"A Comparison of Blocking Methods for Record Linkage","publication_year":2014,"publication_date":"2014-01-01","ids":{"openalex":"https://openalex.org/W1724849505","doi":"https://doi.org/10.1007/978-3-319-11257-2_20","mag":"1724849505"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-319-11257-2_20","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-319-11257-2_20","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048743195","display_name":"Rebecca C. Steorts","orcid":"https://orcid.org/0000-0003-0114-8181"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Rebecca C. Steorts","raw_affiliation_strings":["Department of Statistics, Carnegie Mellon University, Pittsburgh, PA, U.S.A., 15213"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Statistics, Carnegie Mellon University, Pittsburgh, PA, U.S.A., 15213","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033891696","display_name":"Samuel Ventura","orcid":"https://orcid.org/0000-0002-4178-2921"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Samuel L. Ventura","raw_affiliation_strings":["Department of Statistics, Carnegie Mellon University, Pittsburgh, PA, U.S.A., 15213"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Statistics, Carnegie Mellon University, Pittsburgh, PA, U.S.A., 15213","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038833573","display_name":"Mauricio Sadinle","orcid":"https://orcid.org/0000-0002-7092-3877"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mauricio Sadinle","raw_affiliation_strings":["Department of Statistics, Carnegie Mellon University, Pittsburgh, PA, U.S.A., 15213"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Statistics, Carnegie Mellon University, Pittsburgh, PA, U.S.A., 15213","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108604141","display_name":"Stephen E. Fienberg","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Stephen E. Fienberg","raw_affiliation_strings":["Department of Statistics, Carnegie Mellon University, Pittsburgh, PA, U.S.A., 15213"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Statistics, Carnegie Mellon University, Pittsburgh, PA, U.S.A., 15213","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5048743195"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":null,"fwci":18.1626,"has_fulltext":false,"cited_by_count":118,"citation_normalized_percentile":{"value":0.99384443,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"253","last_page":"268"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10237","display_name":"Cryptography and Data Security","score":0.9797999858856201,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8335480690002441},{"id":"https://openalex.org/keywords/merge","display_name":"Merge (version control)","score":0.7588084936141968},{"id":"https://openalex.org/keywords/blocking","display_name":"Blocking (statistics)","score":0.645276665687561},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.576668381690979},{"id":"https://openalex.org/keywords/identifier","display_name":"Identifier","score":0.5701277852058411},{"id":"https://openalex.org/keywords/record-linkage","display_name":"Record linkage","score":0.4946129024028778},{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.4737188220024109},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.4513954818248749},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.43416115641593933},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3980602025985718},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3717961311340332},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.21388232707977295},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.1859196126461029},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.0891343355178833},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.08197575807571411},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07513770461082458}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8335480690002441},{"id":"https://openalex.org/C197129107","wikidata":"https://www.wikidata.org/wiki/Q1921621","display_name":"Merge (version control)","level":2,"score":0.7588084936141968},{"id":"https://openalex.org/C144745244","wikidata":"https://www.wikidata.org/wiki/Q4927286","display_name":"Blocking (statistics)","level":2,"score":0.645276665687561},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.576668381690979},{"id":"https://openalex.org/C154504017","wikidata":"https://www.wikidata.org/wiki/Q853614","display_name":"Identifier","level":2,"score":0.5701277852058411},{"id":"https://openalex.org/C142210648","wikidata":"https://www.wikidata.org/wiki/Q1266546","display_name":"Record linkage","level":3,"score":0.4946129024028778},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.4737188220024109},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.4513954818248749},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.43416115641593933},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3980602025985718},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3717961311340332},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.21388232707977295},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.1859196126461029},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0891343355178833},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.08197575807571411},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07513770461082458},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/978-3-319-11257-2_20","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-319-11257-2_20","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W31058924","https://openalex.org/W131624900","https://openalex.org/W198157877","https://openalex.org/W1518784700","https://openalex.org/W1547556487","https://openalex.org/W1736726159","https://openalex.org/W1916258859","https://openalex.org/W2013909137","https://openalex.org/W2031250218","https://openalex.org/W2032005951","https://openalex.org/W2036216970","https://openalex.org/W2047940964","https://openalex.org/W2059139185","https://openalex.org/W2095029525","https://openalex.org/W2102763740","https://openalex.org/W2105016630","https://openalex.org/W2127048411","https://openalex.org/W2159481891","https://openalex.org/W2183685420","https://openalex.org/W2539180806","https://openalex.org/W2792631716","https://openalex.org/W3084924609","https://openalex.org/W3102641634"],"related_works":["https://openalex.org/W4378651134","https://openalex.org/W1979633005","https://openalex.org/W2352307597","https://openalex.org/W2163724607","https://openalex.org/W2989796854","https://openalex.org/W2911599090","https://openalex.org/W2548183822","https://openalex.org/W4294243532","https://openalex.org/W2033159440","https://openalex.org/W2141965543"],"abstract_inverted_index":null,"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":12},{"year":2022,"cited_by_count":17},{"year":2021,"cited_by_count":13},{"year":2020,"cited_by_count":17},{"year":2019,"cited_by_count":11},{"year":2018,"cited_by_count":19},{"year":2017,"cited_by_count":8},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":5},{"year":2014,"cited_by_count":1}],"updated_date":"2026-04-27T08:22:11.395708","created_date":"2025-10-10T00:00:00"}
