{"id":"https://openalex.org/W7139960898","doi":"https://doi.org/10.48550/arxiv.2603.19141","title":"SHAPCA: Consistent and Interpretable Explanations for Machine Learning Models on Spectroscopy Data","display_name":"SHAPCA: Consistent and Interpretable Explanations for Machine Learning Models on Spectroscopy Data","publication_year":2026,"publication_date":"2026-03-19","ids":{"openalex":"https://openalex.org/W7139960898","doi":"https://doi.org/10.48550/arxiv.2603.19141"},"language":"en","primary_location":{"id":"pmh:oai:cora.ucc.ie:10468/18687","is_oa":true,"landing_page_url":"https://hdl.handle.net/10468/18687","pdf_url":null,"source":{"id":"https://openalex.org/S4306400766","display_name":"Cork Open Research Archive (University College Cork)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I27577105","host_organization_name":"University College Cork","host_organization_lineage":["https://openalex.org/I27577105"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/acceptedVersion"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hdl.handle.net/10468/18687","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100621291","display_name":"Mingxing Zhang","orcid":"https://orcid.org/0000-0001-8363-6968"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Mingxing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5099178888","display_name":"Nicola Rossberg","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rossberg, Nicola","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5099178893","display_name":"Simone Innocente","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Innocente, Simone","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032885126","display_name":"Katarzyna Komolibus","orcid":"https://orcid.org/0000-0003-4545-6100"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Komolibus, Katarzyna","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046368790","display_name":"Rekha Gautam","orcid":"https://orcid.org/0000-0002-1176-8491"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gautam, Rekha","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130248288","display_name":"Barry O'Sullivan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"O'Sullivan, Barry","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130222270","display_name":"Luca Longo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Longo, Luca","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5045006994","display_name":"Andrea Visentin","orcid":"https://orcid.org/0000-0003-3702-4826"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Visentin, Andrea","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5100621291"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10640","display_name":"Spectroscopy and Chemometric Analyses","score":0.27379998564720154,"subfield":{"id":"https://openalex.org/subfields/1602","display_name":"Analytical Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10640","display_name":"Spectroscopy and Chemometric Analyses","score":0.27379998564720154,"subfield":{"id":"https://openalex.org/subfields/1602","display_name":"Analytical Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11324","display_name":"Spectroscopy Techniques in Biomedical and Chemical Research","score":0.15369999408721924,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.11699999868869781,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.9514999985694885},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.6879000067710876},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.6610999703407288},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.569599986076355},{"id":"https://openalex.org/keywords/collinearity","display_name":"Collinearity","score":0.5622000098228455},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.49790000915527344},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4964999854564667},{"id":"https://openalex.org/keywords/principal-component-analysis","display_name":"Principal component analysis","score":0.39959999918937683},{"id":"https://openalex.org/keywords/exploratory-data-analysis","display_name":"Exploratory data analysis","score":0.35740000009536743}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.9514999985694885},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7595000267028809},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.7282000184059143},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.6879000067710876},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.6610999703407288},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5899999737739563},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.569599986076355},{"id":"https://openalex.org/C106192678","wikidata":"https://www.wikidata.org/wiki/Q1419761","display_name":"Collinearity","level":2,"score":0.5622000098228455},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.49790000915527344},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4964999854564667},{"id":"https://openalex.org/C27438332","wikidata":"https://www.wikidata.org/wiki/Q2873","display_name":"Principal component analysis","level":2,"score":0.39959999918937683},{"id":"https://openalex.org/C120894424","wikidata":"https://www.wikidata.org/wiki/Q1322871","display_name":"Exploratory data analysis","level":2,"score":0.35740000009536743},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.3515999913215637},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3327000141143799},{"id":"https://openalex.org/C55037315","wikidata":"https://www.wikidata.org/wiki/Q5421151","display_name":"Experimental data","level":2,"score":0.3025999963283539},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3025999963283539},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2854999899864197},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.2838999927043915},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.28200000524520874},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.26739999651908875},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2662000060081482},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.25699999928474426},{"id":"https://openalex.org/C93361087","wikidata":"https://www.wikidata.org/wiki/Q4426698","display_name":"Data consistency","level":2,"score":0.2551000118255615},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.25209999084472656},{"id":"https://openalex.org/C3018260909","wikidata":"https://www.wikidata.org/wiki/Q1322871","display_name":"Exploratory analysis","level":2,"score":0.25189998745918274}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:cora.ucc.ie:10468/18687","is_oa":true,"landing_page_url":"https://hdl.handle.net/10468/18687","pdf_url":null,"source":{"id":"https://openalex.org/S4306400766","display_name":"Cork Open Research Archive (University College Cork)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I27577105","host_organization_name":"University College Cork","host_organization_lineage":["https://openalex.org/I27577105"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/acceptedVersion"},{"id":"doi:10.48550/arxiv.2603.19141","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19141","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:cora.ucc.ie:10468/18687","is_oa":true,"landing_page_url":"https://hdl.handle.net/10468/18687","pdf_url":null,"source":{"id":"https://openalex.org/S4306400766","display_name":"Cork Open Research Archive (University College Cork)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I27577105","host_organization_name":"University College Cork","host_organization_lineage":["https://openalex.org/I27577105"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/acceptedVersion"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"machine":[3,117],"learning":[4,118],"models":[5],"have":[6,90],"been":[7,91],"increasingly":[8],"applied":[9],"to":[10,34,58,78,93,136,152],"spectroscopic":[11],"datasets":[12],"for":[13],"chemical":[14],"and":[15,25,29,36,48,73,107,128,149,164,194],"biomedical":[16],"analysis.":[17],"For":[18],"their":[19],"successful":[20],"adoption,":[21],"particularly":[22],"in":[23,80,139],"clinical":[24],"safety-critical":[26],"settings,":[27],"professionals":[28],"researchers":[30],"must":[31],"be":[32],"able":[33],"understand":[35],"trust":[37],"the":[38,44,71,95,102,105,108,140,153,168,179,189,192],"reasoning":[39],"behind":[40],"model":[41,59,66,174],"predictions.":[42,185],"However,":[43],"inherently":[45],"high":[46],"dimensionality":[47,126],"strong":[49],"collinearity":[50],"of":[51,75,191],"spectroscopy":[52],"data":[53],"pose":[54],"a":[55,145],"fundamental":[56],"challenge":[57],"explainability.":[60],"These":[61],"properties":[62],"not":[63],"only":[64],"complicate":[65],"training":[67,85],"but":[68],"also":[69],"undermine":[70],"stability":[72],"consistency":[74,196],"explanations,":[76],"leading":[77],"fluctuations":[79],"feature":[81],"importance":[82],"across":[83,197],"repeated":[84],"runs.":[86,199],"Feature":[87],"extraction":[88],"techniques":[89],"used":[92],"reduce":[94],"input":[96,142],"dimensionality;":[97],"these":[98],"new":[99],"features":[100,181],"hinder":[101],"connection":[103],"between":[104],"prediction":[106],"original":[109,141],"signal.":[110],"This":[111],"study":[112],"proposes":[113],"SHAPCA,":[114],"an":[115],"explainable":[116],"pipeline":[119],"that":[120,171,182],"combines":[121],"Principal":[122],"Component":[123],"Analysis":[124],"(for":[125,132],"reduction)":[127],"Shapely":[129],"Additive":[130],"exPlanations":[131],"post":[133],"hoc":[134],"explanation)":[135],"provide":[137],"explanations":[138],"space,":[143],"which":[144],"practitioner":[146],"can":[147],"interpret":[148],"link":[150],"back":[151],"biological":[154],"components.":[155],"The":[156],"proposed":[157],"framework":[158],"enables":[159],"analysis":[160,187],"from":[161],"both":[162],"global":[163],"local":[165],"perspectives,":[166],"revealing":[167],"spectral":[169],"bands":[170],"drive":[172],"overall":[173],"behaviour":[175],"as":[176,178],"well":[177],"instance-specific":[180],"influence":[183],"individual":[184],"Numerical":[186],"demonstrated":[188],"interpretability":[190],"results":[193],"greater":[195],"different":[198]},"counts_by_year":[],"updated_date":"2026-05-03T08:25:01.440150","created_date":"2026-03-21T00:00:00"}
