{"id":"https://openalex.org/W4385330045","doi":"https://doi.org/10.1021/acs.jcim.3c00396","title":"Interpretable Molecular Property Predictions Using Marginalized Graph Kernels","display_name":"Interpretable Molecular Property Predictions Using Marginalized Graph Kernels","publication_year":2023,"publication_date":"2023-07-28","ids":{"openalex":"https://openalex.org/W4385330045","doi":"https://doi.org/10.1021/acs.jcim.3c00396","pmid":"https://pubmed.ncbi.nlm.nih.gov/37504964"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.3c00396","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.3c00396","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100611584","display_name":"Yan Xiang","orcid":"https://orcid.org/0000-0003-4796-2912"},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"education","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yan Xiang","raw_affiliation_strings":["Department of Biomedical Engineering, Duke University, Durham, North Carolina 27705, United States"],"affiliations":[{"raw_affiliation_string":"Department of Biomedical Engineering, Duke University, Durham, North Carolina 27705, United States","institution_ids":["https://openalex.org/I170897317"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040471064","display_name":"Yuhang Tang","orcid":"https://orcid.org/0000-0001-7424-5439"},"institutions":[{"id":"https://openalex.org/I148283060","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yu-Hang Tang","raw_affiliation_strings":["Computational Research Division, Lawrence Berkeley National Laboratory, Berkeley, California 94720, United States"],"affiliations":[{"raw_affiliation_string":"Computational Research Division, Lawrence Berkeley National Laboratory, Berkeley, California 94720, United States","institution_ids":["https://openalex.org/I148283060"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078138445","display_name":"Guang Lin","orcid":"https://orcid.org/0000-0002-0976-1987"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Guang Lin","raw_affiliation_strings":["Department of Mathematics & School of Mechanical Engineering, Purdue University, West Lafayette, Indiana 47907, United States"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics & School of Mechanical Engineering, Purdue University, West Lafayette, Indiana 47907, United States","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020392456","display_name":"Daniel Reker","orcid":"https://orcid.org/0000-0003-4789-7380"},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"education","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Daniel Reker","raw_affiliation_strings":["Department of Biomedical Engineering, Duke University, Durham, North Carolina 27705, United States"],"affiliations":[{"raw_affiliation_string":"Department of Biomedical Engineering, Duke University, Durham, North Carolina 27705, United States","institution_ids":["https://openalex.org/I170897317"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5020392456"],"corresponding_institution_ids":["https://openalex.org/I170897317"],"apc_list":null,"apc_paid":null,"fwci":0.6779,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.62765675,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"63","issue":"15","first_page":"4633","last_page":"4640"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10836","display_name":"Metabolomics and Mass Spectrometry Studies","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.9719215631484985},{"id":"https://openalex.org/keywords/kriging","display_name":"Kriging","score":0.6449733972549438},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5797547698020935},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5650493502616882},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5608291625976562},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5496687293052673},{"id":"https://openalex.org/keywords/molecular-graph","display_name":"Molecular graph","score":0.46817225217819214},{"id":"https://openalex.org/keywords/property","display_name":"Property (philosophy)","score":0.4487685561180115},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.4407445192337036},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4326178729534149},{"id":"https://openalex.org/keywords/attribution","display_name":"Attribution","score":0.4283842444419861},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.42484864592552185},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3658360540866852},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3472026586532593},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2981921434402466},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.17805778980255127},{"id":"https://openalex.org/keywords/discrete-mathematics","display_name":"Discrete mathematics","score":0.09785374999046326},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.07275643944740295}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.9719215631484985},{"id":"https://openalex.org/C81692654","wikidata":"https://www.wikidata.org/wiki/Q225926","display_name":"Kriging","level":2,"score":0.6449733972549438},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5797547698020935},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5650493502616882},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5608291625976562},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5496687293052673},{"id":"https://openalex.org/C2780022179","wikidata":"https://www.wikidata.org/wiki/Q1986794","display_name":"Molecular graph","level":3,"score":0.46817225217819214},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.4487685561180115},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.4407445192337036},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4326178729534149},{"id":"https://openalex.org/C143299363","wikidata":"https://www.wikidata.org/wiki/Q900584","display_name":"Attribution","level":2,"score":0.4283842444419861},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.42484864592552185},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3658360540866852},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3472026586532593},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2981921434402466},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.17805778980255127},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.09785374999046326},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.07275643944740295},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016011","descriptor_name":"Normal Distribution","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016011","descriptor_name":"Normal Distribution","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1021/acs.jcim.3c00396","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.3c00396","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:37504964","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37504964","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.4399999976158142,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320309133","display_name":"Duke University","ror":"https://ror.org/00py81415"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W1583837637","https://openalex.org/W1982597534","https://openalex.org/W2008505552","https://openalex.org/W2060531713","https://openalex.org/W2066532920","https://openalex.org/W2097851570","https://openalex.org/W2295107390","https://openalex.org/W2594183968","https://openalex.org/W2616247523","https://openalex.org/W2736101782","https://openalex.org/W2747592475","https://openalex.org/W2776454016","https://openalex.org/W2897970024","https://openalex.org/W2913954081","https://openalex.org/W2916327454","https://openalex.org/W2925177113","https://openalex.org/W2937307539","https://openalex.org/W2946617578","https://openalex.org/W2966357564","https://openalex.org/W2968071222","https://openalex.org/W2979411997","https://openalex.org/W3000120900","https://openalex.org/W3011127514","https://openalex.org/W3031603244","https://openalex.org/W3102564565","https://openalex.org/W3103176605","https://openalex.org/W3103523530","https://openalex.org/W3134420455","https://openalex.org/W3136815881","https://openalex.org/W3152893301","https://openalex.org/W3169334666","https://openalex.org/W4211049957","https://openalex.org/W4212774754","https://openalex.org/W4225984735","https://openalex.org/W4292756573","https://openalex.org/W4309258819","https://openalex.org/W6959636964"],"related_works":["https://openalex.org/W4385957992","https://openalex.org/W4229079080","https://openalex.org/W4206534706","https://openalex.org/W4385965371","https://openalex.org/W4386025632","https://openalex.org/W3006943036","https://openalex.org/W4200511449","https://openalex.org/W4299487748","https://openalex.org/W2983881875","https://openalex.org/W4321373706"],"abstract_inverted_index":{"Marginalized":[0],"graph":[1,49,73,93,119,179],"kernels":[2],"have":[3],"shown":[4],"competitive":[5],"performance":[6],"in":[7,24,138,173],"molecular":[8,31,86,127,184],"machine":[9,143],"learning":[10,144],"tasks":[11],"but":[12],"currently":[13],"lack":[14],"measures":[15,41,84],"of":[16,57,68,71,81,111,118,162,165,177],"interpretability,":[17],"which":[18],"are":[19],"important":[20,171],"to":[21,52,61,74,92],"improve":[22],"trust":[23],"the":[25,55,62,66,72,75,79,108,115,131,139,158,163,174],"models,":[26],"detect":[27],"biases,":[28],"and":[29,37,64,99,105,146,167],"inform":[30],"optimization":[32],"campaigns.":[33],"We":[34,77,89,122],"here":[35],"conceive":[36],"implement":[38],"two":[39,100],"interpretability":[40,83,164],"for":[42,85,182],"Gaussian":[43],"process":[44],"regression":[45],"using":[46,130],"a":[47,125],"marginalized":[48,178],"kernel":[50,180],"(GPR-MGK)":[51],"quantify":[53],"(1)":[54],"contribution":[56,67],"specific":[58,69],"training":[59,140],"data":[60,103,133,154],"prediction":[63],"(2)":[65],"nodes":[70],"prediction.":[76,88],"demonstrate":[78],"applicability":[80],"these":[82],"property":[87],"compare":[90],"GPR-MGK":[91,112,166],"neural":[94,120],"networks":[95],"on":[96,152],"four":[97],"logic":[98],"real-world":[101],"toxicology":[102],"sets":[104],"find":[106],"that":[107],"atomic":[109,116],"attribution":[110,117,128],"generally":[113],"outperforms":[114],"networks.":[121],"also":[123],"perform":[124,150],"detailed":[126],"analysis":[129],"FreeSolv":[132],"set,":[134],"showing":[135],"how":[136],"molecules":[137],"set":[141],"influence":[142],"predictions":[145],"why":[147],"Morgan":[148],"fingerprints":[149],"poorly":[151],"this":[153],"set.":[155],"This":[156],"is":[157,169],"first":[159],"systematic":[160],"examination":[161],"thereby":[168],"an":[170],"step":[172],"further":[175],"maturation":[176],"methods":[181],"interpretable":[183],"predictions.":[185]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
