{"id":"https://openalex.org/W2296190009","doi":"https://doi.org/10.5220/0005594700360045","title":"POP: A Parallel Optimized Preparation of Data for Data Mining","display_name":"POP: A Parallel Optimized Preparation of Data for Data Mining","publication_year":2015,"publication_date":"2015-01-01","ids":{"openalex":"https://openalex.org/W2296190009","doi":"https://doi.org/10.5220/0005594700360045","mag":"2296190009"},"language":"en","primary_location":{"id":"doi:10.5220/0005594700360045","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0005594700360045","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 7th International Joint Conference on Knowledge Discovery, Knowledge Engineering and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.5220/0005594700360045","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003919873","display_name":"Christian Ernst","orcid":null},"institutions":[{"id":"https://openalex.org/I3019848993","display_name":"Mines Saint-\u00c9tienne","ror":"https://ror.org/05a1dws80","country_code":"FR","type":"education","lineage":["https://openalex.org/I203339264","https://openalex.org/I205703379","https://openalex.org/I3019848993"]},{"id":"https://openalex.org/I4210099416","display_name":"Laboratoire d'Informatique, de Mod\u00e9lisation et d'Optimisation des Syst\u00e8mes","ror":"https://ror.org/00t3fpp34","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I198244214","https://openalex.org/I198244214","https://openalex.org/I203339264","https://openalex.org/I205703379","https://openalex.org/I3019848993","https://openalex.org/I4210099416","https://openalex.org/I4210123221","https://openalex.org/I4210159245","https://openalex.org/I4387154249"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Christian Ernst","raw_affiliation_strings":["Ecole des Mines de St Etienne and LIMOS, France"],"affiliations":[{"raw_affiliation_string":"Ecole des Mines de St Etienne and LIMOS, France","institution_ids":["https://openalex.org/I3019848993","https://openalex.org/I4210099416"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034042028","display_name":"Youssef Hmamouche","orcid":"https://orcid.org/0009-0002-1831-7295"},"institutions":[{"id":"https://openalex.org/I21491767","display_name":"Aix-Marseille Universit\u00e9","ror":"https://ror.org/035xkbk20","country_code":"FR","type":"education","lineage":["https://openalex.org/I21491767"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Youssef Hmamouche","raw_affiliation_strings":["Aix Marseille Universite, France"],"affiliations":[{"raw_affiliation_string":"Aix Marseille Universite, France","institution_ids":["https://openalex.org/I21491767"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046438141","display_name":"Alain Casali","orcid":null},"institutions":[{"id":"https://openalex.org/I21491767","display_name":"Aix-Marseille Universit\u00e9","ror":"https://ror.org/035xkbk20","country_code":"FR","type":"education","lineage":["https://openalex.org/I21491767"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Alain Casali","raw_affiliation_strings":["Aix Marseille Universite, France"],"affiliations":[{"raw_affiliation_string":"Aix Marseille Universite, France","institution_ids":["https://openalex.org/I21491767"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5003919873"],"corresponding_institution_ids":["https://openalex.org/I3019848993","https://openalex.org/I4210099416"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.10585442,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"36","last_page":"45"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9908000230789185,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12205","display_name":"Time Series Analysis and Forecasting","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discretization","display_name":"Discretization","score":0.9018659591674805},{"id":"https://openalex.org/keywords/outlier","display_name":"Outlier","score":0.7106906175613403},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7088955640792847},{"id":"https://openalex.org/keywords/discretization-of-continuous-features","display_name":"Discretization of continuous features","score":0.6734433770179749},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5974046587944031},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.5355287790298462},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.5105620622634888},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.5042184591293335},{"id":"https://openalex.org/keywords/anomaly-detection","display_name":"Anomaly detection","score":0.45679476857185364},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.4328489303588867},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.371123731136322},{"id":"https://openalex.org/keywords/discretization-error","display_name":"Discretization error","score":0.36387819051742554},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.24835968017578125},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2376776933670044},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.20346012711524963},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.1470763385295868}],"concepts":[{"id":"https://openalex.org/C73000952","wikidata":"https://www.wikidata.org/wiki/Q17007827","display_name":"Discretization","level":2,"score":0.9018659591674805},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.7106906175613403},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7088955640792847},{"id":"https://openalex.org/C105427703","wikidata":"https://www.wikidata.org/wiki/Q665193","display_name":"Discretization of continuous features","level":4,"score":0.6734433770179749},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5974046587944031},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.5355287790298462},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.5105620622634888},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.5042184591293335},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.45679476857185364},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.4328489303588867},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.371123731136322},{"id":"https://openalex.org/C126148662","wikidata":"https://www.wikidata.org/wiki/Q3890355","display_name":"Discretization error","level":3,"score":0.36387819051742554},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.24835968017578125},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2376776933670044},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.20346012711524963},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.1470763385295868},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.5220/0005594700360045","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0005594700360045","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 7th International Joint Conference on Knowledge Discovery, Knowledge Engineering and Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.5220/0005594700360045","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0005594700360045","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 7th International Joint Conference on Knowledge Discovery, Knowledge Engineering and Knowledge Management","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.7699999809265137,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W158024899","https://openalex.org/W567872570","https://openalex.org/W1530010412","https://openalex.org/W1553696291","https://openalex.org/W1978239142","https://openalex.org/W1990701202","https://openalex.org/W2017238524","https://openalex.org/W2061122559","https://openalex.org/W2079615115","https://openalex.org/W2129905273","https://openalex.org/W2154106727","https://openalex.org/W2154714154","https://openalex.org/W2161160262","https://openalex.org/W2229992002","https://openalex.org/W2238565287","https://openalex.org/W2319794630","https://openalex.org/W2733465072","https://openalex.org/W2742334063","https://openalex.org/W2963512953","https://openalex.org/W3011400958","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W2499612753","https://openalex.org/W3111802945","https://openalex.org/W2946096271","https://openalex.org/W2295423552","https://openalex.org/W1598471830","https://openalex.org/W3107369729","https://openalex.org/W37066597","https://openalex.org/W2028070877","https://openalex.org/W1993570899","https://openalex.org/W69783631"],"abstract_inverted_index":{"In":[0],"light":[1],"of":[2,26,36,65,96],"the":[3,24,37,52,58,63,81,89,93,110,141,148],"fact":[4],"that":[5,62,136,146],"data":[6,13,25,71],"preparation":[7],"has":[8],"a":[9,116],"substantial":[10],"impact":[11],"on":[12,39,69,115],"mining":[14],"results,":[15],"we":[16,60,103],"provide":[17],"an":[18,44,66,105],"original":[19],"framework":[20],"for":[21,33,108],"automatically":[22],"preparing":[23],"any":[27],"given":[28],"database.":[29],"Our":[30],"research":[31],"focuses,":[32],"each":[34],"attribute":[35],"database,":[38],"two":[40],"points:":[41],"(i)":[42],"Specifying":[43],"optimized":[45,111],"outlier":[46,67],"detection":[47,64],"method,":[48,84],"and":[49],"(ii),":[50],"Identifying":[51],"most":[53],"appropriate":[54],"discretization":[55,83,112,144],"method.":[56],"Concerning":[57],"former,":[59],"illustrate":[61],"depends":[68],"if":[70],"distribution":[72,98],"is":[73,86,88,138,147],"normal":[74],"or":[75],"not.":[76],"When":[77],"attempting":[78],"to":[79],"discern":[80],"best":[82],"what":[85],"important":[87],"shape":[90],"followed":[91],"by":[92],"density":[94],"function":[95],"its":[97],"law.":[99],"For":[100],"this":[101],"reason,":[102],"propose":[104],"automatic":[106],"choice":[107],"finding":[109],"method":[113,145],"based":[114],"multi-criteria":[117],"(Entropy,":[118],"Variance,":[119],"Stability)":[120],"evaluation.":[121],"Processings":[122],"are":[123],"performed":[124],"in":[125],"parallel":[126],"using":[127],"multicore":[128],"capabilities.":[129],"Conducted":[130],"experiments":[131],"validate":[132],"our":[133],"approach,":[134],"showing":[135],"it":[137],"not":[139],"always":[140],"very":[142],"same":[143],"best.":[149]},"counts_by_year":[{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
