{"id":"https://openalex.org/W4406799292","doi":"https://doi.org/10.1186/s40537-024-01041-1","title":"A problem-agnostic approach to feature selection and analysis using SHAP","display_name":"A problem-agnostic approach to feature selection and analysis using SHAP","publication_year":2025,"publication_date":"2025-01-24","ids":{"openalex":"https://openalex.org/W4406799292","doi":"https://doi.org/10.1186/s40537-024-01041-1"},"language":"en","primary_location":{"id":"doi:10.1186/s40537-024-01041-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-024-01041-1","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-024-01041-1","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-024-01041-1","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047489766","display_name":"John Hancock","orcid":null},"institutions":[{"id":"https://openalex.org/I63772739","display_name":"Florida Atlantic University","ror":"https://ror.org/05p8w6387","country_code":"US","type":"education","lineage":["https://openalex.org/I63772739"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"John T. Hancock","raw_affiliation_strings":["College of Engineering and Computer Science, Florida Atlantic University, Boca Raton, USA"],"affiliations":[{"raw_affiliation_string":"College of Engineering and Computer Science, Florida Atlantic University, Boca Raton, USA","institution_ids":["https://openalex.org/I63772739"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089170562","display_name":"Taghi M. Khoshgoftaar","orcid":null},"institutions":[{"id":"https://openalex.org/I63772739","display_name":"Florida Atlantic University","ror":"https://ror.org/05p8w6387","country_code":"US","type":"education","lineage":["https://openalex.org/I63772739"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Taghi M. Khoshgoftaar","raw_affiliation_strings":["College of Engineering and Computer Science, Florida Atlantic University, Boca Raton, USA"],"affiliations":[{"raw_affiliation_string":"College of Engineering and Computer Science, Florida Atlantic University, Boca Raton, USA","institution_ids":["https://openalex.org/I63772739"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088443245","display_name":"Qianxin Liang","orcid":null},"institutions":[{"id":"https://openalex.org/I63772739","display_name":"Florida Atlantic University","ror":"https://ror.org/05p8w6387","country_code":"US","type":"education","lineage":["https://openalex.org/I63772739"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Qianxin Liang","raw_affiliation_strings":["College of Engineering and Computer Science, Florida Atlantic University, Boca Raton, USA"],"affiliations":[{"raw_affiliation_string":"College of Engineering and Computer Science, Florida Atlantic University, Boca Raton, USA","institution_ids":["https://openalex.org/I63772739"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5047489766"],"corresponding_institution_ids":["https://openalex.org/I63772739"],"apc_list":{"value":1060,"currency":"GBP","value_usd":1300},"apc_paid":{"value":1060,"currency":"GBP","value_usd":1300},"fwci":111.275,"has_fulltext":true,"cited_by_count":51,"citation_normalized_percentile":{"value":0.99966432,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"12","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.830533504486084},{"id":"https://openalex.org/keywords/computational-science-and-engineering","display_name":"Computational Science and Engineering","score":0.6963107585906982},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.6814931035041809},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5839062929153442},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5488243699073792},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.30491477251052856},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.2525021433830261}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.830533504486084},{"id":"https://openalex.org/C68597687","wikidata":"https://www.wikidata.org/wiki/Q362601","display_name":"Computational Science and Engineering","level":2,"score":0.6963107585906982},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.6814931035041809},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5839062929153442},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5488243699073792},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.30491477251052856},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.2525021433830261},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s40537-024-01041-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-024-01041-1","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-024-01041-1","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:5a1864bf65764f8890a33f64865a5a95","is_oa":true,"landing_page_url":"https://doaj.org/article/5a1864bf65764f8890a33f64865a5a95","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Big Data, Vol 12, Iss 1, Pp 1-22 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s40537-024-01041-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-024-01041-1","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-024-01041-1","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.47999998927116394}],"awards":[],"funders":[{"id":"https://openalex.org/F4320310801","display_name":"Florida Atlantic University","ror":"https://ror.org/05p8w6387"},{"id":"https://openalex.org/F4320317380","display_name":"Universidad del Atl\u00e1ntico","ror":"https://ror.org/05mm1w714"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4406799292.pdf","grobid_xml":"https://content.openalex.org/works/W4406799292.grobid-xml"},"referenced_works_count":22,"referenced_works":["https://openalex.org/W1678356000","https://openalex.org/W1981276685","https://openalex.org/W2089468765","https://openalex.org/W2112796928","https://openalex.org/W2136655611","https://openalex.org/W2295598076","https://openalex.org/W2318680981","https://openalex.org/W2318802957","https://openalex.org/W2945876440","https://openalex.org/W2966860114","https://openalex.org/W2992495437","https://openalex.org/W3027745518","https://openalex.org/W4235730433","https://openalex.org/W4246413330","https://openalex.org/W4293771366","https://openalex.org/W4316020340","https://openalex.org/W4317040541","https://openalex.org/W4360764315","https://openalex.org/W4384521853","https://openalex.org/W4386274077","https://openalex.org/W4386274100","https://openalex.org/W4389989016"],"related_works":["https://openalex.org/W4393232657","https://openalex.org/W4390638272","https://openalex.org/W4205762803","https://openalex.org/W2472237121","https://openalex.org/W4323316863","https://openalex.org/W1985111449","https://openalex.org/W4304789336","https://openalex.org/W4405801673","https://openalex.org/W4386564352","https://openalex.org/W2952668426"],"abstract_inverted_index":{"Feature":[0],"selection":[1,41,54,95],"is":[2,56,85,112,145,162,180,199],"an":[3],"effective":[4],"data":[5,84,97,108,141,158],"reduction":[6,98],"technique.":[7],"SHapley":[8],"Additive":[9],"exPlanations":[10],"(SHAP)":[11],"can":[12,123,150],"be":[13,90,124,151,185],"used":[14,125,152],"to":[15,75,163,203],"provide":[16,164],"a":[17,39,114,147,165,205],"feature":[18,35,40,53,94,132,136,182,206],"importance":[19,36],"ranking":[20,37,48],"for":[21,64,96,104,130,135,157],"models":[22],"built":[23],"with":[24,99,128,155,187],"labeled":[25,83,140],"or":[26],"unlabeled":[27],"data.":[28,65],"Thus,":[29],"one":[30,110],"may":[31,184],"use":[32,67],"the":[33,45,60,68,172,193,200,211],"SHAP":[34,103,129,156,188],"in":[38,126,153,171,210],"technique":[42,55],"by":[43],"selecting":[44],"k":[46],"highest":[47],"features.":[49],"Furthermore,":[50],"this":[51,105,198],"SHAP-based":[52],"applicable":[57,209],"regardless":[58],"of":[59,62,109,168,195],"availability":[61,79,175,214],"labels":[63],"We":[66,92],"Kaggle":[69],"Credit":[70],"Card":[71],"Fraud":[72],"detection":[73],"dataset":[74],"simulate":[76],"three":[77,173,212],"label":[78,174,213],"scenarios.":[80,176,215],"When":[81,107],"no":[82],"available,":[86,113],"unsupervised":[87],"learners":[88],"should":[89],"used.":[91],"explore":[93,204],"Isolation":[100],"Forest":[101],"and":[102,134],"case.":[106],"class":[111],"one-class":[115],"classifier,":[116],"such":[117],"as":[118],"Gaussian":[119],"Mixture":[120],"Model":[121],"(GMM)":[122],"combination":[127],"determining":[131],"importance,":[133],"selection.":[137],"Finally,":[138],"if":[139],"from":[142],"both":[143],"classes":[144],"available":[146],"binary-class":[148],"classifier":[149],"conjunction":[154],"reduction.":[159],"Our":[160,177],"contribution":[161],"comparative":[166],"analysis":[167,207],"features":[169],"selected":[170],"primary":[178],"conclusion":[179],"that":[181],"sets":[183],"reduced":[186],"without":[189],"compromising":[190],"performance.":[191],"To":[192],"best":[194],"our":[196],"knowledge,":[197],"first":[201],"study":[202],"technique,":[208]},"counts_by_year":[{"year":2026,"cited_by_count":19},{"year":2025,"cited_by_count":32}],"updated_date":"2026-04-23T09:07:50.710637","created_date":"2025-10-10T00:00:00"}
