{"id":"https://openalex.org/W4223934638","doi":"https://doi.org/10.1145/3512850.3512856","title":"A Multi-layer Approach for Data Cleaning in the Healthcare Domain","display_name":"A Multi-layer Approach for Data Cleaning in the Healthcare Domain","publication_year":2022,"publication_date":"2022-01-11","ids":{"openalex":"https://openalex.org/W4223934638","doi":"https://doi.org/10.1145/3512850.3512856"},"language":"en","primary_location":{"id":"doi:10.1145/3512850.3512856","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3512850.3512856","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 The 8th International Conference on Computing and Data Engineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041438914","display_name":"Konstantinos Mavrogiorgos","orcid":null},"institutions":[{"id":"https://openalex.org/I154757721","display_name":"University of Piraeus","ror":"https://ror.org/02qs84g94","country_code":"GR","type":"education","lineage":["https://openalex.org/I154757721"]}],"countries":["GR"],"is_corresponding":true,"raw_author_name":"Konstantinos Mavrogiorgos","raw_affiliation_strings":["University of Piraeus, Greece"],"affiliations":[{"raw_affiliation_string":"University of Piraeus, Greece","institution_ids":["https://openalex.org/I154757721"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007408273","display_name":"Athanasios Kiourtis","orcid":"https://orcid.org/0000-0002-1681-3626"},"institutions":[{"id":"https://openalex.org/I154757721","display_name":"University of Piraeus","ror":"https://ror.org/02qs84g94","country_code":"GR","type":"education","lineage":["https://openalex.org/I154757721"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Athanasios Kiourtis","raw_affiliation_strings":["University of Piraeus, Greece"],"affiliations":[{"raw_affiliation_string":"University of Piraeus, Greece","institution_ids":["https://openalex.org/I154757721"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025387207","display_name":"Argyro Mavrogiorgou","orcid":"https://orcid.org/0000-0002-1543-5627"},"institutions":[{"id":"https://openalex.org/I154757721","display_name":"University of Piraeus","ror":"https://ror.org/02qs84g94","country_code":"GR","type":"education","lineage":["https://openalex.org/I154757721"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Argyro Mavrogiorgou","raw_affiliation_strings":["University of Piraeus, Greece"],"affiliations":[{"raw_affiliation_string":"University of Piraeus, Greece","institution_ids":["https://openalex.org/I154757721"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034519985","display_name":"Spyridon Kleftakis","orcid":"https://orcid.org/0000-0002-6237-488X"},"institutions":[{"id":"https://openalex.org/I154757721","display_name":"University of Piraeus","ror":"https://ror.org/02qs84g94","country_code":"GR","type":"education","lineage":["https://openalex.org/I154757721"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Spyridon Kleftakis","raw_affiliation_strings":["University of Piraeus, Greece"],"affiliations":[{"raw_affiliation_string":"University of Piraeus, Greece","institution_ids":["https://openalex.org/I154757721"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069674161","display_name":"Dimosthenis Kyriazis","orcid":"https://orcid.org/0000-0001-7019-7214"},"institutions":[{"id":"https://openalex.org/I154757721","display_name":"University of Piraeus","ror":"https://ror.org/02qs84g94","country_code":"GR","type":"education","lineage":["https://openalex.org/I154757721"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Dimosthenis Kyriazis","raw_affiliation_strings":["University of Piraeus, Greece"],"affiliations":[{"raw_affiliation_string":"University of Piraeus, Greece","institution_ids":["https://openalex.org/I154757721"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5041438914"],"corresponding_institution_ids":["https://openalex.org/I154757721"],"apc_list":null,"apc_paid":null,"fwci":4.5766,"has_fulltext":false,"cited_by_count":32,"citation_normalized_percentile":{"value":0.95134509,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"22","last_page":"28"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.9887999892234802,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7398477792739868},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.6359584331512451},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.5985981822013855},{"id":"https://openalex.org/keywords/data-quality","display_name":"Data quality","score":0.5732594728469849},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5579819679260254},{"id":"https://openalex.org/keywords/data-consistency","display_name":"Data consistency","score":0.5457248091697693},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5373951196670532},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5312827825546265},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5287216305732727},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5155408382415771},{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.48587745428085327},{"id":"https://openalex.org/keywords/data-extraction","display_name":"Data extraction","score":0.43460822105407715},{"id":"https://openalex.org/keywords/health-care","display_name":"Health care","score":0.4104686975479126},{"id":"https://openalex.org/keywords/risk-analysis","display_name":"Risk analysis (engineering)","score":0.3885036110877991},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.27211087942123413},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.18046057224273682},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.17293903231620789}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7398477792739868},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.6359584331512451},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.5985981822013855},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.5732594728469849},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5579819679260254},{"id":"https://openalex.org/C93361087","wikidata":"https://www.wikidata.org/wiki/Q4426698","display_name":"Data consistency","level":2,"score":0.5457248091697693},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5373951196670532},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5312827825546265},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5287216305732727},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5155408382415771},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.48587745428085327},{"id":"https://openalex.org/C2777466982","wikidata":"https://www.wikidata.org/wiki/Q5227287","display_name":"Data extraction","level":3,"score":0.43460822105407715},{"id":"https://openalex.org/C160735492","wikidata":"https://www.wikidata.org/wiki/Q31207","display_name":"Health care","level":2,"score":0.4104686975479126},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.3885036110877991},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.27211087942123413},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.18046057224273682},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.17293903231620789},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C2779473830","wikidata":"https://www.wikidata.org/wiki/Q1540899","display_name":"MEDLINE","level":2,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3512850.3512856","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3512850.3512856","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 The 8th International Conference on Computing and Data Engineering","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W13923090","https://openalex.org/W935072310","https://openalex.org/W1569123402","https://openalex.org/W1591052160","https://openalex.org/W1841820628","https://openalex.org/W1999823970","https://openalex.org/W2129598390","https://openalex.org/W2486604124","https://openalex.org/W2540149843","https://openalex.org/W2555756618","https://openalex.org/W2773493195","https://openalex.org/W2792931617","https://openalex.org/W2886924127","https://openalex.org/W2921480582","https://openalex.org/W2940548648","https://openalex.org/W2961651406","https://openalex.org/W2965653205","https://openalex.org/W3012665221","https://openalex.org/W3099805387","https://openalex.org/W3199506417","https://openalex.org/W4237040408","https://openalex.org/W4240849091","https://openalex.org/W4242428206","https://openalex.org/W4242475056","https://openalex.org/W4243814030","https://openalex.org/W4252415590","https://openalex.org/W6797722056"],"related_works":["https://openalex.org/W2386805970","https://openalex.org/W2308026613","https://openalex.org/W2379416403","https://openalex.org/W2901600492","https://openalex.org/W1985571776","https://openalex.org/W2165253724","https://openalex.org/W2769374332","https://openalex.org/W2971748376","https://openalex.org/W2403946900","https://openalex.org/W2349091876"],"abstract_inverted_index":{"It":[0],"is":[1,76,124,167],"an":[2,296],"undeniable":[3],"fact":[4],"that":[5,13,63,75,105,152,252,284],"nowadays":[6],"there":[7,70],"exists":[8],"a":[9,43,73,139,170,205],"plethora":[10],"of":[11,21,35,40,48,82,91,102,122,181,185,191,207,231,243,256,266,280],"sources":[12,32],"can":[14],"generate":[15],"data":[16,65,101,140,151,171,183,221,234,257,286],"with":[17,276],"complex":[18],"and,":[19],"most":[20,39],"the":[22,46,53,80,83,89,92,109,131,135,176,179,182,201,226,229,232,241,249,267,270,277,285,300],"time,":[23],"error-prone":[24],"nature,":[25],"as":[26,28],"well":[27],"multiple":[29,219],"origins.":[30],"Those":[31],"may":[33],"be":[34,72,154],"different":[36,254],"complexity,":[37],"but":[38],"them":[41],"share":[42],"common":[44],"characteristic:":[45],"lack":[47],"performing":[49],"quality":[50,104,177],"checks":[51],"on":[52],"collected":[54,84],"data.":[55],"The":[56,117,188,264],"aforementioned":[57],"implies":[58],"that,":[59],"in":[60,163,260],"every":[61],"platform":[62],"utilizes":[64],"originating":[66],"from":[67,248],"those":[68],"sources,":[69],"should":[71],"mechanism":[74,123,142,173,189,268,288],"responsible":[77,196],"for":[78,114,119,174,197],"assuring":[79,175],"reliability":[81,180],"data,":[85,137,202],"thus":[86,294],"providing":[87,295],"to":[88,108,130,146,149,224],"rest":[90],"platform's":[93],"mechanisms":[94],"(e.g.,":[95],"risk":[96],"analysis":[97],"and":[98,178,199,216,228,258,291],"prediction":[99],"mechanisms)":[100],"high":[103],"could":[106],"lead":[107],"best":[110],"knowledge":[111],"extraction":[112],"possible":[113],"decision":[115],"making.":[116],"need":[118],"this":[120,164],"kind":[121],"even":[125],"greater":[126],"when":[127],"it":[128,166],"comes":[129],"healthcare":[132,150,250],"domain":[133,251],"because":[134],"clean":[136],"which":[138],"cleaning":[141,172,208,222,235,287],"produces,":[143],"are":[144,273],"essential":[145],"bring":[147],"consistency":[148],"might":[153],"inaccurate,":[155],"outdated,":[156],"redundant":[157],"or":[158],"incomplete.":[159],"Considering":[160],"these":[161,281],"challenges,":[162],"paper":[165],"being":[168,195,274],"proposed":[169],"regardless":[184],"their":[186,261],"origin.":[187],"consists":[190],"three":[192,244],"(3)":[193,245],"sub-components,":[194],"ingesting":[198],"storing":[200],"also":[203],"including":[204],"set":[206],"actions.":[209],"These":[210],"actions,":[211],"namely":[212],"\u201cValidation\u201d,":[213],"\u201cCleaning\u201d,":[214],"\u201cVerification\u201d":[215],"\u201cLogging\u201d,":[217],"combine":[218],"well-established":[220],"techniques":[223],"ensure":[225],"effectiveness":[227],"efficiency":[230],"whole":[233],"procedure.":[236],"Its":[237],"evaluation":[238],"process":[239],"includes":[240],"usage":[242],"separate":[246],"datasets":[247],"contain":[253],"types":[255],"errors":[259],"corresponding":[262],"records.":[263],"results":[265],"(i.e.,":[269],"cleaned":[271],"data)":[272],"compared":[275],"ground":[278],"truth":[279],"datasets,":[282],"resulting":[283],"was":[289],"successfully":[290],"efficiently":[292],"preformed,":[293],"extensive":[297],"insight":[298],"regarding":[299],"mechanism's":[301],"capabilities.":[302]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":14},{"year":2024,"cited_by_count":8},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
