{"id":"https://openalex.org/W2058733945","doi":"https://doi.org/10.1007/s00450-011-0177-x","title":"Multi-pass sorted neighborhood blocking with MapReduce","display_name":"Multi-pass sorted neighborhood blocking with MapReduce","publication_year":2011,"publication_date":"2011-05-17","ids":{"openalex":"https://openalex.org/W2058733945","doi":"https://doi.org/10.1007/s00450-011-0177-x","mag":"2058733945"},"language":"en","primary_location":{"id":"doi:10.1007/s00450-011-0177-x","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s00450-011-0177-x","pdf_url":null,"source":{"id":"https://openalex.org/S22130598","display_name":"Computer Science - Research and Development","issn_l":"1865-2034","issn":["1865-2034","1865-2042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computer Science - Research and Development","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089424078","display_name":"Lars Kolb","orcid":null},"institutions":[{"id":"https://openalex.org/I926574661","display_name":"Leipzig University","ror":"https://ror.org/03s7gtk40","country_code":"DE","type":"education","lineage":["https://openalex.org/I926574661"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Lars Kolb","raw_affiliation_strings":["Institut f\u00fcr Informatik, Fakult\u00e4t f\u00fcr Mathematik und Informatik, Universit\u00e4t Leipzig, PF 100920, 04009, Leipzig, Germany","Institut f\u00fcr Informatik, Fakult\u00e4t f\u00fcr Mathematik und Informatik, Universit\u00e4t Leipzig, Leipzig, Germany 04009#TAB#"],"affiliations":[{"raw_affiliation_string":"Institut f\u00fcr Informatik, Fakult\u00e4t f\u00fcr Mathematik und Informatik, Universit\u00e4t Leipzig, PF 100920, 04009, Leipzig, Germany","institution_ids":["https://openalex.org/I926574661"]},{"raw_affiliation_string":"Institut f\u00fcr Informatik, Fakult\u00e4t f\u00fcr Mathematik und Informatik, Universit\u00e4t Leipzig, Leipzig, Germany 04009#TAB#","institution_ids":["https://openalex.org/I926574661"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015557906","display_name":"Andreas Thor","orcid":"https://orcid.org/0000-0003-2575-2893"},"institutions":[{"id":"https://openalex.org/I926574661","display_name":"Leipzig University","ror":"https://ror.org/03s7gtk40","country_code":"DE","type":"education","lineage":["https://openalex.org/I926574661"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Andreas Thor","raw_affiliation_strings":["Institut f\u00fcr Informatik, Fakult\u00e4t f\u00fcr Mathematik und Informatik, Universit\u00e4t Leipzig, PF 100920, 04009, Leipzig, Germany","Institut f\u00fcr Informatik, Fakult\u00e4t f\u00fcr Mathematik und Informatik, Universit\u00e4t Leipzig, Leipzig, Germany 04009#TAB#"],"affiliations":[{"raw_affiliation_string":"Institut f\u00fcr Informatik, Fakult\u00e4t f\u00fcr Mathematik und Informatik, Universit\u00e4t Leipzig, PF 100920, 04009, Leipzig, Germany","institution_ids":["https://openalex.org/I926574661"]},{"raw_affiliation_string":"Institut f\u00fcr Informatik, Fakult\u00e4t f\u00fcr Mathematik und Informatik, Universit\u00e4t Leipzig, Leipzig, Germany 04009#TAB#","institution_ids":["https://openalex.org/I926574661"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075756237","display_name":"Erhard Rahm","orcid":"https://orcid.org/0000-0002-2665-1114"},"institutions":[{"id":"https://openalex.org/I926574661","display_name":"Leipzig University","ror":"https://ror.org/03s7gtk40","country_code":"DE","type":"education","lineage":["https://openalex.org/I926574661"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Erhard Rahm","raw_affiliation_strings":["Institut f\u00fcr Informatik, Fakult\u00e4t f\u00fcr Mathematik und Informatik, Universit\u00e4t Leipzig, PF 100920, 04009, Leipzig, Germany","Institut f\u00fcr Informatik, Fakult\u00e4t f\u00fcr Mathematik und Informatik, Universit\u00e4t Leipzig, Leipzig, Germany 04009#TAB#"],"affiliations":[{"raw_affiliation_string":"Institut f\u00fcr Informatik, Fakult\u00e4t f\u00fcr Mathematik und Informatik, Universit\u00e4t Leipzig, PF 100920, 04009, Leipzig, Germany","institution_ids":["https://openalex.org/I926574661"]},{"raw_affiliation_string":"Institut f\u00fcr Informatik, Fakult\u00e4t f\u00fcr Mathematik und Informatik, Universit\u00e4t Leipzig, Leipzig, Germany 04009#TAB#","institution_ids":["https://openalex.org/I926574661"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5089424078"],"corresponding_institution_ids":["https://openalex.org/I926574661"],"apc_list":null,"apc_paid":null,"fwci":9.3138,"has_fulltext":false,"cited_by_count":80,"citation_normalized_percentile":{"value":0.97992861,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"27","issue":"1","first_page":"45","last_page":"63"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11614","display_name":"Cloud Data Security Solutions","score":0.9805999994277954,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9778000116348267,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8966752886772156},{"id":"https://openalex.org/keywords/blocking","display_name":"Blocking (statistics)","score":0.7541805505752563},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.6257208585739136},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.6073015928268433},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5938519835472107},{"id":"https://openalex.org/keywords/sorting","display_name":"Sorting","score":0.5106428265571594},{"id":"https://openalex.org/keywords/replication","display_name":"Replication (statistics)","score":0.49455806612968445},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.479796439409256},{"id":"https://openalex.org/keywords/execution-time","display_name":"Execution time","score":0.4130600094795227},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.14820444583892822},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.12099277973175049},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.07548418641090393}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8966752886772156},{"id":"https://openalex.org/C144745244","wikidata":"https://www.wikidata.org/wiki/Q4927286","display_name":"Blocking (statistics)","level":2,"score":0.7541805505752563},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.6257208585739136},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.6073015928268433},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5938519835472107},{"id":"https://openalex.org/C111696304","wikidata":"https://www.wikidata.org/wiki/Q2303697","display_name":"Sorting","level":2,"score":0.5106428265571594},{"id":"https://openalex.org/C12590798","wikidata":"https://www.wikidata.org/wiki/Q3933199","display_name":"Replication (statistics)","level":2,"score":0.49455806612968445},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.479796439409256},{"id":"https://openalex.org/C2989134064","wikidata":"https://www.wikidata.org/wiki/Q288510","display_name":"Execution time","level":2,"score":0.4130600094795227},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.14820444583892822},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.12099277973175049},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.07548418641090393},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/s00450-011-0177-x","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s00450-011-0177-x","pdf_url":null,"source":{"id":"https://openalex.org/S22130598","display_name":"Computer Science - Research and Development","issn_l":"1865-2034","issn":["1865-2034","1865-2042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computer Science - Research and Development","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.752.9330","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.752.9330","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://arxiv.org/pdf/1010.3053.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.6499999761581421,"display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1539265392","https://openalex.org/W1597532222","https://openalex.org/W1610496399","https://openalex.org/W1700279323","https://openalex.org/W1981590391","https://openalex.org/W1997020216","https://openalex.org/W1997927541","https://openalex.org/W2008941054","https://openalex.org/W2024770506","https://openalex.org/W2097225630","https://openalex.org/W2104511295","https://openalex.org/W2108991785","https://openalex.org/W2114296561","https://openalex.org/W2126399065","https://openalex.org/W2131629857","https://openalex.org/W2151930506","https://openalex.org/W2164456230","https://openalex.org/W2170039925","https://openalex.org/W2171574281","https://openalex.org/W2173213060","https://openalex.org/W2223011434","https://openalex.org/W2295151155","https://openalex.org/W2964250627","https://openalex.org/W3146259567","https://openalex.org/W4211012425"],"related_works":["https://openalex.org/W2392835431","https://openalex.org/W2120447654","https://openalex.org/W2977179488","https://openalex.org/W2144453115","https://openalex.org/W2128223750","https://openalex.org/W4238532390","https://openalex.org/W2188872161","https://openalex.org/W1965371215","https://openalex.org/W2002978035","https://openalex.org/W2126932387"],"abstract_inverted_index":null,"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":9},{"year":2017,"cited_by_count":10},{"year":2016,"cited_by_count":9},{"year":2015,"cited_by_count":10},{"year":2014,"cited_by_count":5},{"year":2013,"cited_by_count":8},{"year":2012,"cited_by_count":6}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
