{"id":"https://openalex.org/W1995541812","doi":"https://doi.org/10.1007/s00778-009-0161-2","title":"Creating probabilistic databases from duplicated data","display_name":"Creating probabilistic databases from duplicated data","publication_year":2009,"publication_date":"2009-08-19","ids":{"openalex":"https://openalex.org/W1995541812","doi":"https://doi.org/10.1007/s00778-009-0161-2","mag":"1995541812"},"language":"en","primary_location":{"id":"doi:10.1007/s00778-009-0161-2","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s00778-009-0161-2","pdf_url":null,"source":{"id":"https://openalex.org/S78926909","display_name":"The VLDB Journal","issn_l":"0949-877X","issn":["0949-877X","1066-8888"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The VLDB Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068065546","display_name":"Oktie Hassanzadeh","orcid":"https://orcid.org/0000-0001-5307-9857"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Oktie Hassanzadeh","raw_affiliation_strings":["Department of Computer Science, University of Toronto, Toronto, Canada","Department of Computer Science, University of Toronto, Toronto, CANADA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Toronto, Toronto, Canada","institution_ids":["https://openalex.org/I185261750"]},{"raw_affiliation_string":"Department of Computer Science, University of Toronto, Toronto, CANADA","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022619313","display_name":"Ren\u00e9e J. Miller","orcid":"https://orcid.org/0000-0002-1484-4787"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Ren\u00e9e J. Miller","raw_affiliation_strings":["Department of Computer Science, University of Toronto, Toronto, Canada","Department of Computer Science, University of Toronto, Toronto, CANADA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Toronto, Toronto, Canada","institution_ids":["https://openalex.org/I185261750"]},{"raw_affiliation_string":"Department of Computer Science, University of Toronto, Toronto, CANADA","institution_ids":["https://openalex.org/I185261750"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5068065546"],"corresponding_institution_ids":["https://openalex.org/I185261750"],"apc_list":{"value":2290,"currency":"EUR","value_usd":2890},"apc_paid":null,"fwci":7.9242,"has_fulltext":false,"cited_by_count":60,"citation_normalized_percentile":{"value":0.97404844,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"18","issue":"5","first_page":"1141","last_page":"1166"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10927","display_name":"Access Control and Trust","score":0.9690999984741211,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8055433034896851},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.638297975063324},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.616685152053833},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6016305685043335},{"id":"https://openalex.org/keywords/data-deduplication","display_name":"Data deduplication","score":0.5690258741378784},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5347629189491272},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.48910433053970337},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.4803296625614166},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.46370774507522583},{"id":"https://openalex.org/keywords/probabilistic-database","display_name":"Probabilistic database","score":0.45166897773742676},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.36616379022598267},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2660927176475525},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.23520976305007935},{"id":"https://openalex.org/keywords/database-theory","display_name":"Database theory","score":0.21991348266601562},{"id":"https://openalex.org/keywords/relational-database","display_name":"Relational database","score":0.19928818941116333}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8055433034896851},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.638297975063324},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.616685152053833},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6016305685043335},{"id":"https://openalex.org/C32587265","wikidata":"https://www.wikidata.org/wiki/Q1182260","display_name":"Data deduplication","level":2,"score":0.5690258741378784},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5347629189491272},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.48910433053970337},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.4803296625614166},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.46370774507522583},{"id":"https://openalex.org/C174539288","wikidata":"https://www.wikidata.org/wiki/Q7246853","display_name":"Probabilistic database","level":4,"score":0.45166897773742676},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.36616379022598267},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2660927176475525},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.23520976305007935},{"id":"https://openalex.org/C12439846","wikidata":"https://www.wikidata.org/wiki/Q4809258","display_name":"Database theory","level":3,"score":0.21991348266601562},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.19928818941116333},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s00778-009-0161-2","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s00778-009-0161-2","pdf_url":null,"source":{"id":"https://openalex.org/S78926909","display_name":"The VLDB Journal","issn_l":"0949-877X","issn":["0949-877X","1066-8888"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The VLDB Journal","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W192724328","https://openalex.org/W254113056","https://openalex.org/W938539187","https://openalex.org/W1486776102","https://openalex.org/W1536860849","https://openalex.org/W1564399566","https://openalex.org/W1569123402","https://openalex.org/W1610496399","https://openalex.org/W1612155886","https://openalex.org/W1646278814","https://openalex.org/W1880262756","https://openalex.org/W1985875030","https://openalex.org/W1990061958","https://openalex.org/W2010595692","https://openalex.org/W2011015278","https://openalex.org/W2024605621","https://openalex.org/W2024932032","https://openalex.org/W2030724586","https://openalex.org/W2036216970","https://openalex.org/W2044494469","https://openalex.org/W2064244056","https://openalex.org/W2073471108","https://openalex.org/W2078686663","https://openalex.org/W2091858563","https://openalex.org/W2092819480","https://openalex.org/W2095368471","https://openalex.org/W2096598900","https://openalex.org/W2097776316","https://openalex.org/W2103269600","https://openalex.org/W2105423800","https://openalex.org/W2108991785","https://openalex.org/W2113076747","https://openalex.org/W2113415503","https://openalex.org/W2114760689","https://openalex.org/W2119057313","https://openalex.org/W2119095788","https://openalex.org/W2121433213","https://openalex.org/W2121564430","https://openalex.org/W2123561513","https://openalex.org/W2127675794","https://openalex.org/W2129598390","https://openalex.org/W2133676910","https://openalex.org/W2138271690","https://openalex.org/W2140757415","https://openalex.org/W2143485006","https://openalex.org/W2148524305","https://openalex.org/W2153508518","https://openalex.org/W2154368191","https://openalex.org/W2161936973","https://openalex.org/W2164625277","https://openalex.org/W2166994031","https://openalex.org/W2167372977","https://openalex.org/W2340365916","https://openalex.org/W2610179052","https://openalex.org/W2914959486","https://openalex.org/W3146259567"],"related_works":["https://openalex.org/W12581771","https://openalex.org/W1774414873","https://openalex.org/W2000084727","https://openalex.org/W2744606804","https://openalex.org/W2739264497","https://openalex.org/W2103934874","https://openalex.org/W4238495367","https://openalex.org/W2125434953","https://openalex.org/W2749065928","https://openalex.org/W2128160835"],"abstract_inverted_index":null,"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":5},{"year":2016,"cited_by_count":6},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":7},{"year":2013,"cited_by_count":4},{"year":2012,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
