{"id":"https://openalex.org/W2294655953","doi":"https://doi.org/10.5220/0004491101380149","title":"Automatic Synthesis of Data Cleansing Activities","display_name":"Automatic Synthesis of Data Cleansing Activities","publication_year":2013,"publication_date":"2013-01-01","ids":{"openalex":"https://openalex.org/W2294655953","doi":"https://doi.org/10.5220/0004491101380149","mag":"2294655953"},"language":"en","primary_location":{"id":"doi:10.5220/0004491101380149","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0004491101380149","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd International Conference on Data Technologies and Applications","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.5220/0004491101380149","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039716498","display_name":"Mario Mezzanzanica","orcid":"https://orcid.org/0000-0003-0399-2810"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Mario Mezzanzanica","raw_affiliation_strings":["Department of Statistics and Quantitative Methods -C.R.I.S.P. Research Centre, University of Milan-Bicocca, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Statistics and Quantitative Methods -C.R.I.S.P. Research Centre, University of Milan-Bicocca, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058377858","display_name":"Roberto Boselli","orcid":"https://orcid.org/0000-0002-4574-3137"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Roberto Boselli","raw_affiliation_strings":["Department of Statistics and Quantitative Methods -C.R.I.S.P. Research Centre, University of Milan-Bicocca, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Statistics and Quantitative Methods -C.R.I.S.P. Research Centre, University of Milan-Bicocca, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049259722","display_name":"Mirko Cesarini","orcid":"https://orcid.org/0000-0001-9601-0403"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Mirko Cesarini","raw_affiliation_strings":["Department of Statistics and Quantitative Methods -C.R.I.S.P. Research Centre, University of Milan-Bicocca, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Statistics and Quantitative Methods -C.R.I.S.P. Research Centre, University of Milan-Bicocca, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047827615","display_name":"Fabio Mercorio","orcid":"https://orcid.org/0000-0001-6864-2702"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Fabio Mercorio","raw_affiliation_strings":["Department of Statistics and Quantitative Methods -C.R.I.S.P. Research Centre, University of Milan-Bicocca, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Statistics and Quantitative Methods -C.R.I.S.P. Research Centre, University of Milan-Bicocca, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5039716498"],"corresponding_institution_ids":["https://openalex.org/I66752286"],"apc_list":null,"apc_paid":null,"fwci":4.5206,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.94796281,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"138","last_page":"149"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9790999889373779,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/data-cleansing","display_name":"Data cleansing","score":0.9131394624710083},{"id":"https://openalex.org/keywords/cleanser","display_name":"Cleanser","score":0.8134480714797974},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.806032657623291},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.6835249066352844},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6260969042778015},{"id":"https://openalex.org/keywords/data-consistency","display_name":"Data consistency","score":0.543563723564148},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.541313648223877},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5094638466835022},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.482854425907135},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4580357074737549},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3351774215698242},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.23841631412506104},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.21435877680778503},{"id":"https://openalex.org/keywords/data-quality","display_name":"Data quality","score":0.19729626178741455}],"concepts":[{"id":"https://openalex.org/C42199009","wikidata":"https://www.wikidata.org/wiki/Q1172378","display_name":"Data cleansing","level":4,"score":0.9131394624710083},{"id":"https://openalex.org/C2780941728","wikidata":"https://www.wikidata.org/wiki/Q17990675","display_name":"Cleanser","level":2,"score":0.8134480714797974},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.806032657623291},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.6835249066352844},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6260969042778015},{"id":"https://openalex.org/C93361087","wikidata":"https://www.wikidata.org/wiki/Q4426698","display_name":"Data consistency","level":2,"score":0.543563723564148},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.541313648223877},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5094638466835022},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.482854425907135},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4580357074737549},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3351774215698242},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.23841631412506104},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.21435877680778503},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.19729626178741455},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.5220/0004491101380149","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0004491101380149","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd International Conference on Data Technologies and Applications","raw_type":"proceedings-article"},{"id":"pmh:oai:boa.unimib.it:10281/44493","is_oa":false,"landing_page_url":"http://hdl.handle.net/10281/44493","pdf_url":null,"source":{"id":"https://openalex.org/S4306401259","display_name":"BOA (University of Milano-Bicocca)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I66752286","host_organization_name":"University of Milano-Bicocca","host_organization_lineage":["https://openalex.org/I66752286"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":{"id":"doi:10.5220/0004491101380149","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0004491101380149","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd International Conference on Data Technologies and Applications","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.4699999988079071,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W178555045","https://openalex.org/W997400855","https://openalex.org/W1499805410","https://openalex.org/W1535740288","https://openalex.org/W1539265392","https://openalex.org/W1544828112","https://openalex.org/W1555519929","https://openalex.org/W1585267848","https://openalex.org/W1587682423","https://openalex.org/W1626378195","https://openalex.org/W1668408280","https://openalex.org/W1700279323","https://openalex.org/W1861600621","https://openalex.org/W1963856566","https://openalex.org/W1978460233","https://openalex.org/W2033657926","https://openalex.org/W2039143807","https://openalex.org/W2046769817","https://openalex.org/W2059009730","https://openalex.org/W2060646170","https://openalex.org/W2070386554","https://openalex.org/W2073254505","https://openalex.org/W2079040219","https://openalex.org/W2080593426","https://openalex.org/W2108991785","https://openalex.org/W2293763696","https://openalex.org/W2340735175","https://openalex.org/W2569536984","https://openalex.org/W2913459036","https://openalex.org/W3146259567"],"related_works":["https://openalex.org/W2240123196","https://openalex.org/W2386805970","https://openalex.org/W2308026613","https://openalex.org/W2379416403","https://openalex.org/W2901600492","https://openalex.org/W2165253724","https://openalex.org/W1985571776","https://openalex.org/W2971748376","https://openalex.org/W2769374332","https://openalex.org/W2167069786"],"abstract_inverted_index":{"Data":[0],"cleansing":[1,44,95,130],"is":[2,28,57,65],"growing":[3],"in":[4,41],"importance":[5],"among":[6],"both":[7],"public":[8],"and":[9,150,166],"private":[10],"organisations,":[11],"mainly":[12],"due":[13],"to":[14,30,103,128,136,154],"the":[15,53,63,72,81,91,141,147,155,159],"relevant":[16],"amount":[17],"of":[18,62,74,83,93,124],"data":[19,43,64,100],"exploited":[20],"for":[21,97],"supporting":[22],"decision":[23],"making":[24,146],"processes.":[25],"This":[26],"paper":[27],"aimed":[29],"show":[31],"how":[32],"model-based":[33],"verification":[34],"algorithms":[35],"(namely,":[36],"model":[37,69],"checking)":[38],"can":[39,118,163],"contribute":[40],"addressing":[42],"issues,":[45],"furthermore":[46],"a":[47,68,104,122,137],"new":[48],"benchmark":[49],"problem":[50],"focusing":[51],"on":[52,71],"labour":[54,143],"market":[55,144],"dynamic":[56],"introduced.":[58],"The":[59,115],"consistent":[60],"evolution":[61],"checked":[66],"using":[67],"defined":[70],"basis":[73],"domain":[75],"knowledge.":[76],"Then,":[77],"we":[78,161],"formally":[79],"introduce":[80],"concept":[82],"universal":[84,116],"cleanser,":[85],"i.e.":[86],"an":[87,110],"object":[88],"which":[89,112],"summarises":[90],"set":[92],"all":[94],"actions":[96],"each":[98],"feasible":[99],"inconsistency":[101],"(according":[102],"given":[105],"consistency":[106],"model),":[107],"then":[108],"providing":[109],"algorithm":[111],"synthesises":[113],"it.":[114],"cleanser":[117],"be":[119,164],"seen":[120],"as":[121],"repository":[123],"corrective":[125],"interventions":[126],"useful":[127],"develop":[129],"routines.":[131],"We":[132],"applied":[133],"our":[134],"approach":[135],"dataset":[138,149],"derived":[139],"from":[140],"Italian":[142],"data,":[145],"whole":[148],"outcomes":[151],"publicly":[152],"available":[153],"community,":[156],"so":[157],"that":[158],"results":[160],"present":[162],"shared":[165],"compared":[167],"with":[168],"other":[169],"techniques":[170]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2016-06-24T00:00:00"}
