{"id":"https://openalex.org/W2003684739","doi":"https://doi.org/10.14778/1687627.1687691","title":"Truth discovery and copying detection in a dynamic world","display_name":"Truth discovery and copying detection in a dynamic world","publication_year":2009,"publication_date":"2009-08-01","ids":{"openalex":"https://openalex.org/W2003684739","doi":"https://doi.org/10.14778/1687627.1687691","mag":"2003684739"},"language":"en","primary_location":{"id":"doi:10.14778/1687627.1687691","is_oa":false,"landing_page_url":"https://doi.org/10.14778/1687627.1687691","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001402526","display_name":"Xin Luna Dong","orcid":"https://orcid.org/0009-0000-8667-322X"},"institutions":[{"id":"https://openalex.org/I1283103587","display_name":"AT&T (United States)","ror":"https://ror.org/02bbd5539","country_code":"US","type":"company","lineage":["https://openalex.org/I1283103587"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xin Luna Dong","raw_affiliation_strings":["AT&amp;T Labs--Research, Florham Park, NJ"],"affiliations":[{"raw_affiliation_string":"AT&amp;T Labs--Research, Florham Park, NJ","institution_ids":["https://openalex.org/I1283103587"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091872345","display_name":"Laure Berti\u2010\u00c9quille","orcid":"https://orcid.org/0000-0002-8046-0570"},"institutions":[{"id":"https://openalex.org/I56067802","display_name":"Universit\u00e9 de Rennes","ror":"https://ror.org/015m7wh34","country_code":"FR","type":"education","lineage":["https://openalex.org/I56067802"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Laure Berti-Equille","raw_affiliation_strings":["Universit\u00e9 de Rennes, Rennes cedex, France"],"affiliations":[{"raw_affiliation_string":"Universit\u00e9 de Rennes, Rennes cedex, France","institution_ids":["https://openalex.org/I56067802"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088315797","display_name":"Divesh Srivastava","orcid":"https://orcid.org/0000-0002-7609-9217"},"institutions":[{"id":"https://openalex.org/I1283103587","display_name":"AT&T (United States)","ror":"https://ror.org/02bbd5539","country_code":"US","type":"company","lineage":["https://openalex.org/I1283103587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Divesh Srivastava","raw_affiliation_strings":["AT&amp;T Labs--Research, Florham Park, NJ"],"affiliations":[{"raw_affiliation_string":"AT&amp;T Labs--Research, Florham Park, NJ","institution_ids":["https://openalex.org/I1283103587"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5001402526"],"corresponding_institution_ids":["https://openalex.org/I1283103587"],"apc_list":null,"apc_paid":null,"fwci":35.7099,"has_fulltext":false,"cited_by_count":236,"citation_normalized_percentile":{"value":0.99650191,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":100},"biblio":{"volume":"2","issue":"1","first_page":"562","last_page":"573"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7823073267936707},{"id":"https://openalex.org/keywords/copying","display_name":"Copying","score":0.7467880249023438},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6430220007896423},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.5933616757392883},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.5400444269180298},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5331472754478455},{"id":"https://openalex.org/keywords/data-quality","display_name":"Data quality","score":0.519580602645874},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.48666197061538696},{"id":"https://openalex.org/keywords/voting","display_name":"Voting","score":0.4601614475250244},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.43928712606430054},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2338753342628479},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.17287778854370117}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7823073267936707},{"id":"https://openalex.org/C2779151265","wikidata":"https://www.wikidata.org/wiki/Q1156791","display_name":"Copying","level":2,"score":0.7467880249023438},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6430220007896423},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.5933616757392883},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5400444269180298},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5331472754478455},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.519580602645874},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.48666197061538696},{"id":"https://openalex.org/C520049643","wikidata":"https://www.wikidata.org/wiki/Q189760","display_name":"Voting","level":3,"score":0.4601614475250244},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.43928712606430054},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2338753342628479},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.17287778854370117},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.14778/1687627.1687691","is_oa":false,"landing_page_url":"https://doi.org/10.14778/1687627.1687691","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.151.5867","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.151.5867","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.vldb.org/pvldb/2/vldb09-335.pdf","raw_type":"text"},{"id":"pmh:oai:HAL:hal-01855862v1","is_oa":false,"landing_page_url":"https://inria.hal.science/hal-01855862","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Proceedings of the VLDB Endowment (PVLDB), 2009, 2 (1), pp.562 - 573. &#x27E8;10.14778/1687627.1687691&#x27E9;","raw_type":"Journal articles"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1568972313","https://openalex.org/W1580310876","https://openalex.org/W1725819718","https://openalex.org/W1987272746","https://openalex.org/W2002087344","https://openalex.org/W2023838631","https://openalex.org/W2031513076","https://openalex.org/W2073545563","https://openalex.org/W2110411158","https://openalex.org/W2118388899","https://openalex.org/W2125838338","https://openalex.org/W2152191782","https://openalex.org/W2155160033","https://openalex.org/W4231488651"],"related_works":["https://openalex.org/W4308771405","https://openalex.org/W2355873265","https://openalex.org/W2963669501","https://openalex.org/W3080197661","https://openalex.org/W4318471783","https://openalex.org/W2760667490","https://openalex.org/W2991781269","https://openalex.org/W775724729","https://openalex.org/W2137489486","https://openalex.org/W2021042108"],"abstract_inverted_index":{"Modern":[0],"information":[1,39,194],"management":[2],"applications":[3],"often":[4,51,104],"require":[5],"integrating":[6],"data":[7,12,21,27,60,70,81,205,223],"from":[8,22,195],"a":[9,30,156,162,169,172,189,204],"variety":[10],"of":[11,15,48,115,130,139,174,210,229],"sources,":[13,76,125],"some":[14],"which":[16,183],"may":[17,99],"copy":[18],"or":[19],"buy":[20],"other":[23],"sources.":[24],"When":[25],"these":[26,152],"sources":[28,50,62,132,140,197],"model":[29,136,191],"dynamically":[31],"changing":[32],"world":[33],"(":[34,95],"e.g.":[35,96],",":[36,97],"people's":[37],"contact":[38],"changes":[40],"over":[41,141,214],"time,":[42],"restaurants":[43],"open":[44],"and":[45,68,119,147,177,207,221,227],"go":[46],"out":[47],"business),":[49],"provide":[52,85],"out-of-date":[53,67],"data.":[54],"Errors":[55],"can":[56],"also":[57],"creep":[58],"into":[59],"when":[61,126],"are":[63],"updated":[64],"often.":[65],"Given":[66],"erroneous":[69],"provided":[71],"by":[72,143],"different,":[73],"possibly":[74],"dependent,":[75],"it":[77,184],"is":[78,133,171],"challenging":[79],"for":[80,203],"integration":[82],"systems":[83],"to":[84,91,101,198],"the":[86,113,121,127,131,137,179,196,200,208,211],"true":[87,117,201,212],"values.":[88],"Straightforward":[89],"ways":[90],"resolve":[92],"such":[93],"inconsistencies":[94],"voting)":[98],"lead":[100],"noisy":[102],"results,":[103],"with":[105],"detrimental":[106],"consequences.":[107],"In":[108],"this":[109],"paper,":[110],"we":[111,154,160,187],"study":[112],"problem":[114],"finding":[116],"values":[118,213],"determining":[120],"copying":[122],"relationship":[123],"between":[124],"update":[128],"history":[129],"known.":[134],"We":[135],"quality":[138],"time":[142],"their":[144],"coverage,":[145],"exactness":[146],"freshness":[148],".":[149],"Based":[150],"on":[151,218],"measures,":[153],"conduct":[155],"probabilistic":[157],"analysis.":[158],"First,":[159],"develop":[161,188],"Hidden":[163],"Markov":[164],"Model":[165],"that":[166,192],"decides":[167],"whether":[168],"source":[170,176],"copier":[173],"another":[175],"identifies":[178],"specific":[180],"moments":[181],"at":[182],"copies.":[185],"Second,":[186],"Bayesian":[190],"aggregates":[193],"decide":[199],"value":[202],"item,":[206],"evolution":[209],"time.":[215],"Experimental":[216],"results":[217],"both":[219],"real-world":[220],"synthetic":[222],"show":[224],"high":[225],"accuracy":[226],"scalability":[228],"our":[230],"techniques.":[231]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":11},{"year":2019,"cited_by_count":27},{"year":2018,"cited_by_count":26},{"year":2017,"cited_by_count":21},{"year":2016,"cited_by_count":18},{"year":2015,"cited_by_count":34},{"year":2014,"cited_by_count":19},{"year":2013,"cited_by_count":12},{"year":2012,"cited_by_count":18}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
