{"id":"https://openalex.org/W2806784378","doi":"https://doi.org/10.1145/3206157.3206172","title":"Fast Entropy Attribute Value Frequency Algorithm to Detect Outliers for Categorical Data","display_name":"Fast Entropy Attribute Value Frequency Algorithm to Detect Outliers for Categorical Data","publication_year":2018,"publication_date":"2018-03-09","ids":{"openalex":"https://openalex.org/W2806784378","doi":"https://doi.org/10.1145/3206157.3206172","mag":"2806784378"},"language":"en","primary_location":{"id":"doi:10.1145/3206157.3206172","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3206157.3206172","pdf_url":"http://dl.acm.org/ft_gateway.cfm?id=3206172&type=pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 International Conference on Big Data and Education","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"http://dl.acm.org/ft_gateway.cfm?id=3206172&type=pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070482385","display_name":"Kang\u2013Mo Jung","orcid":null},"institutions":[{"id":"https://openalex.org/I120158604","display_name":"Kunsan National University","ror":"https://ror.org/02yj55q56","country_code":"KR","type":"education","lineage":["https://openalex.org/I120158604"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Kang-Mo Jung","raw_affiliation_strings":["Kunsan National University, Department of Statistics &amp; Computer Science, Korea"],"affiliations":[{"raw_affiliation_string":"Kunsan National University, Department of Statistics &amp; Computer Science, Korea","institution_ids":["https://openalex.org/I120158604"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5070482385"],"corresponding_institution_ids":["https://openalex.org/I120158604"],"apc_list":null,"apc_paid":null,"fwci":0.1692,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.58969602,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"63","last_page":"66"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9915000200271606,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.8894044160842896},{"id":"https://openalex.org/keywords/outlier","display_name":"Outlier","score":0.8772802352905273},{"id":"https://openalex.org/keywords/anomaly-detection","display_name":"Anomaly detection","score":0.8288437128067017},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6668892502784729},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.6345758438110352},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.5857291221618652},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.46681711077690125},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.46275991201400757},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4403444528579712},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2528803050518036}],"concepts":[{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.8894044160842896},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.8772802352905273},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.8288437128067017},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6668892502784729},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.6345758438110352},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.5857291221618652},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.46681711077690125},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.46275991201400757},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4403444528579712},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2528803050518036},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3206157.3206172","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3206157.3206172","pdf_url":"http://dl.acm.org/ft_gateway.cfm?id=3206172&type=pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 International Conference on Big Data and Education","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3206157.3206172","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3206157.3206172","pdf_url":"http://dl.acm.org/ft_gateway.cfm?id=3206172&type=pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 International Conference on Big Data and Education","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.7200000286102295}],"awards":[{"id":"https://openalex.org/G5903378259","display_name":null,"funder_award_id":"106052","funder_id":"https://openalex.org/F4320320671","funder_display_name":"National Research Foundation"},{"id":"https://openalex.org/G8661133557","display_name":null,"funder_award_id":"NRF-2015R","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G8952370644","display_name":null,"funder_award_id":"NRF-2015","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G982292920","display_name":null,"funder_award_id":"NRF-20","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"}],"funders":[{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"},{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2806784378.pdf","grobid_xml":"https://content.openalex.org/works/W2806784378.grobid-xml"},"referenced_works_count":10,"referenced_works":["https://openalex.org/W1874523587","https://openalex.org/W1876967670","https://openalex.org/W2061122559","https://openalex.org/W2064029323","https://openalex.org/W2117891917","https://openalex.org/W2129281431","https://openalex.org/W2498771658","https://openalex.org/W2609353185","https://openalex.org/W2950186804","https://openalex.org/W4253461361"],"related_works":["https://openalex.org/W4386799044","https://openalex.org/W2773208253","https://openalex.org/W2560646951","https://openalex.org/W2499612753","https://openalex.org/W3111802945","https://openalex.org/W2122407924","https://openalex.org/W2946096271","https://openalex.org/W2295423552","https://openalex.org/W1598471830","https://openalex.org/W3107369729"],"abstract_inverted_index":{"Outliers":[0],"are":[1,42],"extreme":[2],"observations":[3,77],"which":[4],"is":[5,56],"far":[6],"away":[7],"from":[8],"other":[9],"observations.":[10],"Outlier":[11],"detection":[12,30,48],"becomes":[13],"a":[14,57,85,96],"significant":[15],"procedure":[16],"for":[17,49,62,99,117],"many":[18],"applications":[19],"such":[20],"as":[21,103,105],"detecting":[22],"insurance":[23],"fraud":[24],"or":[25],"industrial":[26],"damage.":[27],"Most":[28],"outlier":[29,47],"techniques":[31],"work":[32],"on":[33,46],"numerical":[34],"data,":[35],"that":[36],"is,":[37],"continuous":[38],"attributes.":[39,82],"However,":[40],"there":[41],"few":[43],"research":[44],"works":[45],"categorical":[50,63],"data.":[51,64],"AEVF(Automated":[52],"Entropy":[53],"Value":[54],"Frequency)":[55],"measure":[58],"to":[59,73],"detect":[60],"outliers":[61],"AEVF":[65],"has":[66],"complexity,":[67],"and":[68,78],"it":[69],"cannot":[70],"be":[71,114],"applied":[72],"large":[74],"number":[75,80],"of":[76,81,111],"the":[79],"We":[83],"propose":[84,95],"fast":[86,97],"entropy":[87],"attribute":[88],"value":[89],"frequency(FEAVF)":[90],"having":[91],"complexity.":[92],"Furthermore,":[93],"we":[94],"algorithm":[98],"multiple":[100],"records":[101],"deletion":[102],"well":[104],"single":[106],"record":[107],"deletion.":[108],"The":[109],"performance":[110],"FEAVF":[112],"can":[113],"effectively":[115],"illustrated":[116],"UCI":[118],"machine":[119],"learning":[120],"datasets.":[121]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
