{"id":"https://openalex.org/W2019331060","doi":"https://doi.org/10.1145/1516360.1516458","title":"Time-completeness trade-offs in record linkage using adaptive query processing","display_name":"Time-completeness trade-offs in record linkage using adaptive query processing","publication_year":2009,"publication_date":"2009-03-24","ids":{"openalex":"https://openalex.org/W2019331060","doi":"https://doi.org/10.1145/1516360.1516458","mag":"2019331060"},"language":"en","primary_location":{"id":"doi:10.1145/1516360.1516458","is_oa":true,"landing_page_url":"https://doi.org/10.1145/1516360.1516458","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/1516360.1516458","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 12th International Conference on Extending Database Technology: Advances in Database Technology","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/1516360.1516458","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028531635","display_name":"Roald Lengu","orcid":null},"institutions":[{"id":"https://openalex.org/I83816512","display_name":"University of Genoa","ror":"https://ror.org/0107c5v14","country_code":"IT","type":"education","lineage":["https://openalex.org/I83816512"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Roald Lengu","raw_affiliation_strings":["Universit\u00e0 di Genova, Italy"],"affiliations":[{"raw_affiliation_string":"Universit\u00e0 di Genova, Italy","institution_ids":["https://openalex.org/I83816512"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018918066","display_name":"Paolo Missier","orcid":"https://orcid.org/0000-0002-0978-2446"},"institutions":[{"id":"https://openalex.org/I28407311","display_name":"University of Manchester","ror":"https://ror.org/027m9bs27","country_code":"GB","type":"education","lineage":["https://openalex.org/I28407311"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Paolo Missier","raw_affiliation_strings":["University of Manchester, UK","University of Manchester (UK)"],"affiliations":[{"raw_affiliation_string":"University of Manchester, UK","institution_ids":["https://openalex.org/I28407311"]},{"raw_affiliation_string":"University of Manchester (UK)","institution_ids":["https://openalex.org/I28407311"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057541402","display_name":"Alvaro A. A. Fernandes","orcid":"https://orcid.org/0000-0002-6100-7199"},"institutions":[{"id":"https://openalex.org/I28407311","display_name":"University of Manchester","ror":"https://ror.org/027m9bs27","country_code":"GB","type":"education","lineage":["https://openalex.org/I28407311"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Alvaro A. A. Fernandes","raw_affiliation_strings":["University of Manchester, UK","University of Manchester (UK)"],"affiliations":[{"raw_affiliation_string":"University of Manchester, UK","institution_ids":["https://openalex.org/I28407311"]},{"raw_affiliation_string":"University of Manchester (UK)","institution_ids":["https://openalex.org/I28407311"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020065998","display_name":"Giovanna Guerrini","orcid":"https://orcid.org/0000-0001-9125-9867"},"institutions":[{"id":"https://openalex.org/I83816512","display_name":"University of Genoa","ror":"https://ror.org/0107c5v14","country_code":"IT","type":"education","lineage":["https://openalex.org/I83816512"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Giovanna Guerrini","raw_affiliation_strings":["Universit\u00e0 di Genova, Italy"],"affiliations":[{"raw_affiliation_string":"Universit\u00e0 di Genova, Italy","institution_ids":["https://openalex.org/I83816512"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089929382","display_name":"Marco Mesiti","orcid":"https://orcid.org/0000-0001-5701-0080"},"institutions":[{"id":"https://openalex.org/I189158943","display_name":"University of Milan","ror":"https://ror.org/00wjc7c48","country_code":"IT","type":"education","lineage":["https://openalex.org/I189158943"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marco Mesiti","raw_affiliation_strings":["Universit\u00e0 di Milano, Italy"],"affiliations":[{"raw_affiliation_string":"Universit\u00e0 di Milano, Italy","institution_ids":["https://openalex.org/I189158943"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5028531635"],"corresponding_institution_ids":["https://openalex.org/I83816512"],"apc_list":null,"apc_paid":null,"fwci":2.0802,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.87304314,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"851","last_page":"861"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9828000068664551,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/joins","display_name":"Joins","score":0.79561448097229},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7892372012138367},{"id":"https://openalex.org/keywords/completeness","display_name":"Completeness (order theory)","score":0.7685282826423645},{"id":"https://openalex.org/keywords/tuple","display_name":"Tuple","score":0.7634372711181641},{"id":"https://openalex.org/keywords/data-integration","display_name":"Data integration","score":0.6153436303138733},{"id":"https://openalex.org/keywords/join","display_name":"Join (topology)","score":0.5386111736297607},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5180563926696777},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4933835566043854},{"id":"https://openalex.org/keywords/query-optimization","display_name":"Query optimization","score":0.4875468611717224},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3940916657447815},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.23800408840179443},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.15243706107139587},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.121980220079422}],"concepts":[{"id":"https://openalex.org/C2778692605","wikidata":"https://www.wikidata.org/wiki/Q4041866","display_name":"Joins","level":2,"score":0.79561448097229},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7892372012138367},{"id":"https://openalex.org/C17231256","wikidata":"https://www.wikidata.org/wiki/Q5156540","display_name":"Completeness (order theory)","level":2,"score":0.7685282826423645},{"id":"https://openalex.org/C118930307","wikidata":"https://www.wikidata.org/wiki/Q600590","display_name":"Tuple","level":2,"score":0.7634372711181641},{"id":"https://openalex.org/C72634772","wikidata":"https://www.wikidata.org/wiki/Q386824","display_name":"Data integration","level":2,"score":0.6153436303138733},{"id":"https://openalex.org/C2776124973","wikidata":"https://www.wikidata.org/wiki/Q3183033","display_name":"Join (topology)","level":2,"score":0.5386111736297607},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5180563926696777},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4933835566043854},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.4875468611717224},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3940916657447815},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.23800408840179443},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.15243706107139587},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.121980220079422},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":8,"locations":[{"id":"doi:10.1145/1516360.1516458","is_oa":true,"landing_page_url":"https://doi.org/10.1145/1516360.1516458","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/1516360.1516458","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 12th International Conference on Extending Database Technology: Advances in Database Technology","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/f565634c-7f64-46bd-9748-db518da57402","is_oa":false,"landing_page_url":"https://research.manchester.ac.uk/en/publications/f565634c-7f64-46bd-9748-db518da57402","pdf_url":null,"source":{"id":"https://openalex.org/S4306400662","display_name":"Research Explorer (The University of Manchester)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I28407311","host_organization_name":"University of Manchester","host_organization_lineage":["https://openalex.org/I28407311"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lengu, R, Missier, P, Fernandes, A A A, Guerrini, G & Mesiti, M 2009, Time-completeness trade-offs in record linkage using adaptive query processing. in Proceedings of the 12th International Conference on Extending Database Technology: Advances in Database Technology, EDBT'09|Proc. Int. Conf. Extending Database Technol.: Adv. Database Technol., EDBT. Association for Computing Machinery, pp. 851-861, 12th International Conference on Extending Database Technology: Advances in Database Technology, EDBT'09, Saint Petersburg, 1/07/09. https://doi.org/10.1145/1516360.1516458","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.149.4192","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.149.4192","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cs.man.ac.uk/~alvaro/publications/edbt2009.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.158.8799","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.158.8799","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cs.man.ac.uk/~pmissier/docs/lmfmg-edbt.pdf","raw_type":"text"},{"id":"pmh:oai:air.unimi.it:2434/202320","is_oa":true,"landing_page_url":"http://hdl.handle.net/2434/202320","pdf_url":null,"source":{"id":"https://openalex.org/S4306400516","display_name":"Archivio Istituzionale della Ricerca (Universita Degli Studi Di Milano)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I189158943","host_organization_name":"University of Milan","host_organization_lineage":["https://openalex.org/I189158943"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/conferenceObject"},{"id":"pmh:oai:iris.unige.it:11567/237921","is_oa":false,"landing_page_url":"http://hdl.handle.net/11567/237921","pdf_url":null,"source":{"id":"https://openalex.org/S4377196291","display_name":"CINECA IRIS Institutial Research Information System (University of Genoa)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I83816512","host_organization_name":"University of Genoa","host_organization_lineage":["https://openalex.org/I83816512"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/bookPart"},{"id":"pmh:oai:pure.atira.dk:publications/e39cd548-ed2c-4a90-8be4-3bf011b2d00e","is_oa":true,"landing_page_url":"https://research.birmingham.ac.uk/en/publications/e39cd548-ed2c-4a90-8be4-3bf011b2d00e","pdf_url":null,"source":{"id":"https://openalex.org/S4306402634","display_name":"University of Birmingham Research Portal (University of Birmingham)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79619799","host_organization_name":"University of Birmingham","host_organization_lineage":["https://openalex.org/I79619799"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Lengu , R , Missier , P , Fernandes , A A A , Guerrini , G & Mesiti , M 2009 , Time-completeness trade-offs in record linkage using adaptive query processing . in Proceedings of the 12th International Conference on Extending Database Technology : Advances in Database Technology, EDBT'09 . Proceedings of the 12th International Conference on Extending Database Technology: Advances in Database Technology, EDBT'09 , pp. 851-861 , 12th International Conference on Extending Database Technology: Advances in Database Technology, EDBT'09 , Saint Petersburg , Russian Federation , 24/03/09 . https://doi.org/10.1145/1516360.1516458","raw_type":"contributionToPeriodical"},{"id":"pmh:oai:pure.atira.dk:publications/f565634c-7f64-46bd-9748-db518da57402","is_oa":false,"landing_page_url":"https://www.research.manchester.ac.uk/portal/en/publications/timecompleteness-tradeoffs-in-record-linkage-using-adaptive-query-processing(f565634c-7f64-46bd-9748-db518da57402).html","pdf_url":null,"source":{"id":"https://openalex.org/S4306400662","display_name":"Research Explorer (The University of Manchester)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I28407311","host_organization_name":"University of Manchester","host_organization_lineage":["https://openalex.org/I28407311"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Lengu, R, Missier, P, Fernandes, A A A, Guerrini, G & Mesiti, M 2009, Time-completeness trade-offs in record linkage using adaptive query processing. in Proceedings of the 12th International Conference on Extending Database Technology: Advances in Database Technology, EDBT'09|Proc. Int. Conf. Extending Database Technol.: Adv. Database Technol., EDBT. Association for Computing Machinery, pp. 851-861, 12th International Conference on Extending Database Technology: Advances in Database Technology, EDBT'09, Saint Petersburg, 1/07/09. https://doi.org/10.1145/1516360.1516458","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"doi:10.1145/1516360.1516458","is_oa":true,"landing_page_url":"https://doi.org/10.1145/1516360.1516458","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/1516360.1516458","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 12th International Conference on Extending Database Technology: Advances in Database Technology","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.49000000953674316,"display_name":"Partnerships for the goals","id":"https://metadata.un.org/sdg/17"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2019331060.pdf","grobid_xml":"https://content.openalex.org/works/W2019331060.grobid-xml"},"referenced_works_count":38,"referenced_works":["https://openalex.org/W183249055","https://openalex.org/W340636835","https://openalex.org/W1485156179","https://openalex.org/W1494213010","https://openalex.org/W1515739837","https://openalex.org/W1519440323","https://openalex.org/W1539265392","https://openalex.org/W1571065273","https://openalex.org/W1700279323","https://openalex.org/W1990911977","https://openalex.org/W2041563709","https://openalex.org/W2074013691","https://openalex.org/W2098082683","https://openalex.org/W2106895292","https://openalex.org/W2108075439","https://openalex.org/W2108991785","https://openalex.org/W2109149785","https://openalex.org/W2121516976","https://openalex.org/W2122306341","https://openalex.org/W2129413111","https://openalex.org/W2129598390","https://openalex.org/W2130846207","https://openalex.org/W2138793904","https://openalex.org/W2140894225","https://openalex.org/W2158237121","https://openalex.org/W2161600801","https://openalex.org/W2161936973","https://openalex.org/W2162747054","https://openalex.org/W2545307730","https://openalex.org/W2766000922","https://openalex.org/W4206606839","https://openalex.org/W4301404790","https://openalex.org/W6607508199","https://openalex.org/W6675849627","https://openalex.org/W6679499423","https://openalex.org/W6680982454","https://openalex.org/W6683401941","https://openalex.org/W6683628169"],"related_works":["https://openalex.org/W2368709504","https://openalex.org/W2070598375","https://openalex.org/W2073547112","https://openalex.org/W2594300663","https://openalex.org/W1760549314","https://openalex.org/W2142204059","https://openalex.org/W2015372451","https://openalex.org/W4205954133","https://openalex.org/W1804205637","https://openalex.org/W31162901"],"abstract_inverted_index":{"Applications":[0],"that":[1,20,40,117,162,170],"involve":[2],"data":[3,14,32,37,46],"integration":[4,84],"among":[5],"multiple":[6,144],"sources":[7],"often":[8],"require":[9,41],"a":[10,94,100,112,119,186],"preliminary":[11],"step":[12],"of":[13,44,93,107,121,185],"reconciliation":[15,38],"in":[16,81,97,173,180,189],"order":[17],"to":[18,69,89,153],"ensure":[19],"tuples":[21],"match":[22],"correctly":[23],"across":[24],"the":[25,45,64,78,91,105,183],"sources.":[26],"In":[27,73],"dynamic":[28,83],"settings":[29],"such":[30],"as":[31],"mashups,":[33],"however,":[34],"traditional":[35],"offline":[36],"techniques":[39],"prior":[42],"availability":[43],"may":[47,87],"not":[48],"be":[49,178],"applicable.":[50],"The":[51,133],"alternative,":[52],"performing":[53],"similarity":[54],"joins":[55],"at":[56,182],"query":[57,130,147],"time,":[58],"is":[59,135,159,165],"computationally":[60],"expensive,":[61],"while":[62],"ignoring":[63],"mismatch":[65],"problem":[66],"altogether":[67],"leads":[68],"an":[70],"incomplete":[71],"integration.":[72],"this":[74,108],"paper":[75],"we":[76],"make":[77],"assumption":[79,109],"that,":[80],"some":[82],"scenarios,":[85],"users":[86],"agree":[88],"trade":[90],"completeness":[92,164],"join":[95,115,125,142,155,174],"result":[96,163,190],"return":[98],"for":[99],"faster":[101],"computation.":[102],"We":[103],"explore":[104],"consequences":[106],"by":[110],"proposing":[111],"novel,":[113],"hybrid":[114],"algorithm":[116,134],"involves":[118],"combination":[120],"exact":[122],"and":[123],"approximate":[124,154],"operators,":[126],"managed":[127],"using":[128],"adaptive":[129],"processing":[131],"techniques.":[132],"optimistic:":[136],"it":[137,150],"can":[138,177],"switch":[139],"between":[140],"physical":[141],"operators":[143,156],"times":[145],"throughout":[146],"processing,":[148],"but":[149],"only":[151],"resorts":[152],"when":[157],"there":[158],"statistical":[160],"evidence":[161],"compromised.":[166],"Our":[167],"experiments":[168],"show":[169],"sensible":[171],"savings":[172],"execution":[175],"time":[176],"achieved":[179],"practice,":[181],"expense":[184],"modest":[187],"reduction":[188],"completeness.":[191]},"counts_by_year":[{"year":2015,"cited_by_count":1},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
