{"id":"https://openalex.org/W4400824028","doi":"https://doi.org/10.1007/s10618-024-01056-5","title":"Evaluating outlier probabilities: assessing sharpness, refinement, and calibration using stratified and weighted measures","display_name":"Evaluating outlier probabilities: assessing sharpness, refinement, and calibration using stratified and weighted measures","publication_year":2024,"publication_date":"2024-07-19","ids":{"openalex":"https://openalex.org/W4400824028","doi":"https://doi.org/10.1007/s10618-024-01056-5"},"language":"en","primary_location":{"id":"doi:10.1007/s10618-024-01056-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10618-024-01056-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10618-024-01056-5.pdf","source":{"id":"https://openalex.org/S121920818","display_name":"Data Mining and Knowledge Discovery","issn_l":"1384-5810","issn":["1384-5810","1573-756X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Mining and Knowledge Discovery","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10618-024-01056-5.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047315657","display_name":"Philipp R\u00f6chner","orcid":"https://orcid.org/0000-0003-3376-6670"},"institutions":[{"id":"https://openalex.org/I197323543","display_name":"Johannes Gutenberg University Mainz","ror":"https://ror.org/023b0x485","country_code":"DE","type":"education","lineage":["https://openalex.org/I197323543"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Philipp R\u00f6chner","raw_affiliation_strings":["Johannes Gutenberg University, Mainz, Germany"],"affiliations":[{"raw_affiliation_string":"Johannes Gutenberg University, Mainz, Germany","institution_ids":["https://openalex.org/I197323543"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072064839","display_name":"Henrique O. Marques","orcid":"https://orcid.org/0000-0002-8273-5814"},"institutions":[{"id":"https://openalex.org/I177969490","display_name":"University of Southern Denmark","ror":"https://ror.org/03yrrjy16","country_code":"DK","type":"education","lineage":["https://openalex.org/I177969490"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Henrique O. Marques","raw_affiliation_strings":["University of Southern Denmark, Odense, Denmark"],"affiliations":[{"raw_affiliation_string":"University of Southern Denmark, Odense, Denmark","institution_ids":["https://openalex.org/I177969490"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014723418","display_name":"Ricardo J. G. B. Campello","orcid":"https://orcid.org/0000-0003-0266-3492"},"institutions":[{"id":"https://openalex.org/I177969490","display_name":"University of Southern Denmark","ror":"https://ror.org/03yrrjy16","country_code":"DK","type":"education","lineage":["https://openalex.org/I177969490"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Ricardo J. G. B. Campello","raw_affiliation_strings":["University of Southern Denmark, Odense, Denmark"],"affiliations":[{"raw_affiliation_string":"University of Southern Denmark, Odense, Denmark","institution_ids":["https://openalex.org/I177969490"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047196019","display_name":"Arthur Zimek","orcid":"https://orcid.org/0000-0001-7713-4208"},"institutions":[{"id":"https://openalex.org/I177969490","display_name":"University of Southern Denmark","ror":"https://ror.org/03yrrjy16","country_code":"DK","type":"education","lineage":["https://openalex.org/I177969490"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Arthur Zimek","raw_affiliation_strings":["University of Southern Denmark, Odense, Denmark"],"affiliations":[{"raw_affiliation_string":"University of Southern Denmark, Odense, Denmark","institution_ids":["https://openalex.org/I177969490"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5047315657"],"corresponding_institution_ids":["https://openalex.org/I197323543"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":3.0735,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.92384983,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"38","issue":"6","first_page":"3719","last_page":"3757"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11871","display_name":"Advanced Statistical Methods and Models","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11443","display_name":"Advanced Statistical Process Monitoring","score":0.982200026512146,"subfield":{"id":"https://openalex.org/subfields/1804","display_name":"Statistics, Probability and Uncertainty"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/outlier","display_name":"Outlier","score":0.793807864189148},{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.7663115859031677},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5646056532859802},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5056183338165283},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.47766217589378357},{"id":"https://openalex.org/keywords/anomaly-detection","display_name":"Anomaly detection","score":0.444192498922348},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.364518404006958},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3602735996246338},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.335909903049469}],"concepts":[{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.793807864189148},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.7663115859031677},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5646056532859802},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5056183338165283},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.47766217589378357},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.444192498922348},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.364518404006958},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3602735996246338},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.335909903049469}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1007/s10618-024-01056-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10618-024-01056-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10618-024-01056-5.pdf","source":{"id":"https://openalex.org/S121920818","display_name":"Data Mining and Knowledge Discovery","issn_l":"1384-5810","issn":["1384-5810","1573-756X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Mining and Knowledge Discovery","raw_type":"journal-article"},{"id":"pmh:oai:sdu.dk:publications/d6cc2b85-cddf-4c08-b301-414596b80872","is_oa":true,"landing_page_url":"https://portal.findresearcher.sdu.dk/da/publications/d6cc2b85-cddf-4c08-b301-414596b80872","pdf_url":"https://findresearcher.sdu.dk/ws/files/279311503/s10618-024-01056-5.pdf","source":{"id":"https://openalex.org/S4306400424","display_name":"University of Southern Denmark Research Portal (University of Southern Denmark)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I177969490","host_organization_name":"University of Southern Denmark","host_organization_lineage":["https://openalex.org/I177969490"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"R\u00f6chner, P, Marques, H O, Campello, R J G B & Zimek, A 2024, 'Evaluating outlier probabilities : assessing sharpness, refinement, and calibration using stratified and weighted measures', Data Mining and Knowledge Discovery, vol. 38, no. 6, pp. 3719-3757. https://doi.org/10.1007/s10618-024-01056-5","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:sdu.dk:openaire/d6cc2b85-cddf-4c08-b301-414596b80872","is_oa":true,"landing_page_url":"https://portal.findresearcher.sdu.dk/files/279311503/s10618-024-01056-5.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400423","display_name":"University of Southern Denmark Research Portal (University of Southern Denmark)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I177969490","host_organization_name":"University of Southern Denmark","host_organization_lineage":["https://openalex.org/I177969490"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"R\u00f6chner, P, Marques, H O, Campello, R J G B & Zimek, A 2024, 'Evaluating outlier probabilities : assessing sharpness, refinement, and calibration using stratified and weighted measures', Data Mining and Knowledge Discovery, vol. 38, no. 6, pp. 3719-3757. https://doi.org/10.1007/s10618-024-01056-5","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"doi:10.1007/s10618-024-01056-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10618-024-01056-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10618-024-01056-5.pdf","source":{"id":"https://openalex.org/S121920818","display_name":"Data Mining and Knowledge Discovery","issn_l":"1384-5810","issn":["1384-5810","1573-756X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Mining and Knowledge Discovery","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4400824028.pdf"},"referenced_works_count":45,"referenced_works":["https://openalex.org/W96556717","https://openalex.org/W164607750","https://openalex.org/W309312769","https://openalex.org/W1242748811","https://openalex.org/W1497774109","https://openalex.org/W1545836098","https://openalex.org/W1584412742","https://openalex.org/W1607198972","https://openalex.org/W1981276685","https://openalex.org/W1985749559","https://openalex.org/W1987103639","https://openalex.org/W1995443851","https://openalex.org/W2023943903","https://openalex.org/W2031366272","https://openalex.org/W2041184937","https://openalex.org/W2045765911","https://openalex.org/W2047634553","https://openalex.org/W2049058890","https://openalex.org/W2049633694","https://openalex.org/W2056597459","https://openalex.org/W2073241381","https://openalex.org/W2075159929","https://openalex.org/W2080756387","https://openalex.org/W2098824882","https://openalex.org/W2103914106","https://openalex.org/W2130715829","https://openalex.org/W2160868604","https://openalex.org/W2163757302","https://openalex.org/W2282861635","https://openalex.org/W2769911895","https://openalex.org/W2773235741","https://openalex.org/W2787894218","https://openalex.org/W2791845676","https://openalex.org/W2809161969","https://openalex.org/W3039137796","https://openalex.org/W3089028909","https://openalex.org/W3129166376","https://openalex.org/W3130041243","https://openalex.org/W4226060502","https://openalex.org/W4230927207","https://openalex.org/W4253461361","https://openalex.org/W4254182148","https://openalex.org/W4312423502","https://openalex.org/W4378072425","https://openalex.org/W4384784915"],"related_works":["https://openalex.org/W3006513224","https://openalex.org/W2046456988","https://openalex.org/W2357409937","https://openalex.org/W2510582230","https://openalex.org/W2499612753","https://openalex.org/W3111802945","https://openalex.org/W2946096271","https://openalex.org/W2295423552","https://openalex.org/W1598471830","https://openalex.org/W3107369729"],"abstract_inverted_index":{"Abstract":[0],"An":[1],"outlier":[2,14,19,25,28,34,41,45,54,57,72,80,86,112,123,146,158,195,227,235,251],"probability":[3,6,136,228],"is":[4,10,66,110,210],"the":[5,31,63,122,133,151,169,175,179,191,201,213,239,243,246],"that":[7,84,103,233],"an":[8,11,111,114],"observation":[9,109],"outlier.":[12],"Typically,":[13],"detection":[15,46],"algorithms":[16,47],"calculate":[17],"real-valued":[18],"scores":[20,26,35,42,55],"to":[21,52,56,78,132,150,167,188,238],"identify":[22],"outliers.":[23],"Converting":[24],"into":[27,125,253],"probabilities":[29,58,73,87,124,170,252],"increases":[30],"interpretability":[32],"of":[33,70,135,157,171,178,194,203,215,225,245,249],"for":[36,255],"domain":[37],"experts":[38],"and":[39,74,91,99,118,153,162,182,219,257],"makes":[40,185],"from":[43],"different":[44,226],"comparable.":[48],"Although":[49],"several":[50,140],"transformations":[51],"convert":[53],"have":[59],"been":[60],"proposed":[61,240],"in":[62,137],"literature,":[64],"there":[65],"no":[67,75],"common":[68],"understanding":[69],"good":[71,85,234],"standard":[76],"approach":[77],"evaluate":[79,94,168],"probabilities.":[81,196],"We":[82],"require":[83],"be":[88],"sharp,":[89],"refined,":[90],"calibrated.":[92],"To":[93],"these":[95],"properties,":[96],"we":[97,231],"adapt":[98],"propose":[100],"novel":[101],"measures":[102,120,164],"use":[104,128,177],"ground-truth":[105],"labels":[106,254],"indicating":[107],"which":[108],"or":[113,127],"inlier.":[115],"The":[116],"refinement":[117],"calibration":[119,183],"partition":[121],"bins":[126],"kernel":[129],"smoothing.":[130],"Compared":[131],"evaluation":[134,224],"supervised":[138],"learning,":[139],"aspects":[141],"are":[142,165],"relevant":[143],"when":[144],"evaluating":[145],"probabilities,":[147,236],"mainly":[148],"due":[149],"imbalanced":[152],"often":[154],"unsupervised":[155],"nature":[156],"detection.":[159],"First,":[160],"stratified":[161],"weighted":[163],"necessary":[166],"outliers":[172,256],"well.":[173],"Second,":[174],"joint":[176],"sharpness,":[180],"refinement,":[181],"errors":[184],"it":[186],"possible":[187],"independently":[189],"measure":[190],"corresponding":[192],"characteristics":[193],"Third,":[197],"equiareal":[198],"bins,":[199],"where":[200],"product":[202],"observations":[204,216],"per":[205,217],"bin":[206,208,218,220],"times":[207],"length":[209],"constant,":[211],"balance":[212],"number":[214],"length,":[221],"allowing":[222],"accurate":[223],"ranges.":[229],"Finally,":[230],"show":[232],"according":[237],"measures,":[241],"improve":[242],"performance":[244],"follow-up":[247],"task":[248],"converting":[250],"inliers.":[258]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
