{"id":"https://openalex.org/W3112693917","doi":"https://doi.org/10.1021/acs.jcim.0c00899","title":"<i>Chespa</i>: Streamlining Expansive Chemical Space Evaluation of Molecular Sets","display_name":"<i>Chespa</i>: Streamlining Expansive Chemical Space Evaluation of Molecular Sets","publication_year":2020,"publication_date":"2020-12-07","ids":{"openalex":"https://openalex.org/W3112693917","doi":"https://doi.org/10.1021/acs.jcim.0c00899","mag":"3112693917","pmid":"https://pubmed.ncbi.nlm.nih.gov/33283505"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.0c00899","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.0c00899","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/9648166","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038344776","display_name":"Jamie Nu\u00f1ez","orcid":"https://orcid.org/0000-0002-8594-1648"},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]},{"id":"https://openalex.org/I72951846","display_name":"Washington State University","ror":"https://ror.org/05dk0ce17","country_code":"US","type":"education","lineage":["https://openalex.org/I72951846"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jamie R. Nu\u00f1ez","raw_affiliation_strings":["Earth and Biological Sciences Directorate, Pacific Northwest National Laboratory, Richland, Washington 99352, United States","The Gene and Linda Voiland School of Chemical Engineering and Bioengineering, Washington State University, Pullman, Washington 99164, United States"],"affiliations":[{"raw_affiliation_string":"Earth and Biological Sciences Directorate, Pacific Northwest National Laboratory, Richland, Washington 99352, United States","institution_ids":["https://openalex.org/I142606810"]},{"raw_affiliation_string":"The Gene and Linda Voiland School of Chemical Engineering and Bioengineering, Washington State University, Pullman, Washington 99164, United States","institution_ids":["https://openalex.org/I72951846"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000979385","display_name":"Monee McGrady","orcid":null},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Monee Mcgrady","raw_affiliation_strings":["Earth and Biological Sciences Directorate, Pacific Northwest National Laboratory, Richland, Washington 99352, United States"],"affiliations":[{"raw_affiliation_string":"Earth and Biological Sciences Directorate, Pacific Northwest National Laboratory, Richland, Washington 99352, United States","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085982027","display_name":"Yasemin Yesiltepe","orcid":"https://orcid.org/0000-0001-9437-2347"},"institutions":[{"id":"https://openalex.org/I72951846","display_name":"Washington State University","ror":"https://ror.org/05dk0ce17","country_code":"US","type":"education","lineage":["https://openalex.org/I72951846"]},{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yasemin Yesiltepe","raw_affiliation_strings":["Earth and Biological Sciences Directorate, Pacific Northwest National Laboratory, Richland, Washington 99352, United States","The Gene and Linda Voiland School of Chemical Engineering and Bioengineering, Washington State University, Pullman, Washington 99164, United States"],"affiliations":[{"raw_affiliation_string":"Earth and Biological Sciences Directorate, Pacific Northwest National Laboratory, Richland, Washington 99352, United States","institution_ids":["https://openalex.org/I142606810"]},{"raw_affiliation_string":"The Gene and Linda Voiland School of Chemical Engineering and Bioengineering, Washington State University, Pullman, Washington 99164, United States","institution_ids":["https://openalex.org/I72951846"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051101756","display_name":"Ryan Renslow","orcid":"https://orcid.org/0000-0002-3969-5570"},"institutions":[{"id":"https://openalex.org/I72951846","display_name":"Washington State University","ror":"https://ror.org/05dk0ce17","country_code":"US","type":"education","lineage":["https://openalex.org/I72951846"]},{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ryan S. Renslow","raw_affiliation_strings":["Earth and Biological Sciences Directorate, Pacific Northwest National Laboratory, Richland, Washington 99352, United States","The Gene and Linda Voiland School of Chemical Engineering and Bioengineering, Washington State University, Pullman, Washington 99164, United States"],"affiliations":[{"raw_affiliation_string":"Earth and Biological Sciences Directorate, Pacific Northwest National Laboratory, Richland, Washington 99352, United States","institution_ids":["https://openalex.org/I142606810"]},{"raw_affiliation_string":"The Gene and Linda Voiland School of Chemical Engineering and Bioengineering, Washington State University, Pullman, Washington 99164, United States","institution_ids":["https://openalex.org/I72951846"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034592694","display_name":"Thomas Metz","orcid":"https://orcid.org/0000-0001-6049-3968"},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Thomas O. Metz","raw_affiliation_strings":["Earth and Biological Sciences Directorate, Pacific Northwest National Laboratory, Richland, Washington 99352, United States"],"affiliations":[{"raw_affiliation_string":"Earth and Biological Sciences Directorate, Pacific Northwest National Laboratory, Richland, Washington 99352, United States","institution_ids":["https://openalex.org/I142606810"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5034592694","https://openalex.org/A5051101756"],"corresponding_institution_ids":["https://openalex.org/I142606810","https://openalex.org/I72951846"],"apc_list":null,"apc_paid":null,"fwci":0.5629,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.74034726,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":93,"max":96},"biblio":{"volume":"60","issue":"12","first_page":"6251","last_page":"6257"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10836","display_name":"Metabolomics and Mass Spectrometry Studies","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10908","display_name":"Analytical Chemistry and Chromatography","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/chemical-space","display_name":"Chemical space","score":0.8705337643623352},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5845211148262024},{"id":"https://openalex.org/keywords/observability","display_name":"Observability","score":0.5048838257789612},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4729737341403961},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.4491517245769501},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.43443363904953003},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.43176645040512085},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4315839409828186},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.2753239572048187},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2662743926048279},{"id":"https://openalex.org/keywords/drug-discovery","display_name":"Drug discovery","score":0.17635884881019592}],"concepts":[{"id":"https://openalex.org/C99726746","wikidata":"https://www.wikidata.org/wiki/Q906396","display_name":"Chemical space","level":3,"score":0.8705337643623352},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5845211148262024},{"id":"https://openalex.org/C36299963","wikidata":"https://www.wikidata.org/wiki/Q1369844","display_name":"Observability","level":2,"score":0.5048838257789612},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4729737341403961},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.4491517245769501},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.43443363904953003},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.43176645040512085},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4315839409828186},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.2753239572048187},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2662743926048279},{"id":"https://openalex.org/C74187038","wikidata":"https://www.wikidata.org/wiki/Q1418791","display_name":"Drug discovery","level":2,"score":0.17635884881019592},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D013058","descriptor_name":"Mass Spectrometry","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D013058","descriptor_name":"Mass Spectrometry","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D013058","descriptor_name":"Mass Spectrometry","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":3,"locations":[{"id":"doi:10.1021/acs.jcim.0c00899","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.0c00899","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:33283505","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/33283505","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null},{"id":"pmh:oai:pubmedcentral.nih.gov:9648166","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/9648166","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Chem Inf Model","raw_type":"Text"}],"best_oa_location":{"id":"pmh:oai:pubmedcentral.nih.gov:9648166","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/9648166","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Chem Inf Model","raw_type":"Text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","display_name":"Partnerships for the goals","score":0.4399999976158142}],"awards":[{"id":"https://openalex.org/G1598349242","display_name":null,"funder_award_id":"U2CES030170","funder_id":"https://openalex.org/F4320337361","funder_display_name":"National Institute of Environmental Health Sciences"}],"funders":[{"id":"https://openalex.org/F4320337361","display_name":"National Institute of Environmental Health Sciences","ror":"https://ror.org/00j4k1h63"},{"id":"https://openalex.org/F4320337547","display_name":"Laboratory Directed Research and Development","ror":"https://ror.org/01e41cf67"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W625776585","https://openalex.org/W1592371672","https://openalex.org/W1963879600","https://openalex.org/W1967544219","https://openalex.org/W1971097535","https://openalex.org/W1987971958","https://openalex.org/W1992397471","https://openalex.org/W1997481671","https://openalex.org/W2011301426","https://openalex.org/W2016717705","https://openalex.org/W2017254234","https://openalex.org/W2017360600","https://openalex.org/W2023818227","https://openalex.org/W2026834364","https://openalex.org/W2035753075","https://openalex.org/W2073459066","https://openalex.org/W2075155287","https://openalex.org/W2101234009","https://openalex.org/W2110791536","https://openalex.org/W2129411266","https://openalex.org/W2146292423","https://openalex.org/W2169678694","https://openalex.org/W2292369104","https://openalex.org/W2519454444","https://openalex.org/W2548357532","https://openalex.org/W2596398464","https://openalex.org/W2773987374","https://openalex.org/W2779125761","https://openalex.org/W2791355014","https://openalex.org/W2886900553","https://openalex.org/W2898108532","https://openalex.org/W2905511466","https://openalex.org/W2911354688","https://openalex.org/W2913351693","https://openalex.org/W2956136703","https://openalex.org/W2963609389","https://openalex.org/W2972741532","https://openalex.org/W2982596783","https://openalex.org/W3014785674","https://openalex.org/W3033617175","https://openalex.org/W3100751385","https://openalex.org/W3112682090","https://openalex.org/W3164669644","https://openalex.org/W6969145360","https://openalex.org/W6969259846"],"related_works":["https://openalex.org/W2046459260","https://openalex.org/W2765830098","https://openalex.org/W2967463586","https://openalex.org/W1971989957","https://openalex.org/W2517338020","https://openalex.org/W3157641275","https://openalex.org/W4312300846","https://openalex.org/W4206221578","https://openalex.org/W3029572990","https://openalex.org/W2615757685"],"abstract_inverted_index":{"Thousands":[0],"of":[1,21,32,61,69,79,121,133,163,178,193,229],"chemical":[2,40,56,84,89,92,101,238],"properties":[3],"can":[4,11],"be":[5,12,125],"calculated":[6],"for":[7,37,237],"small":[8],"molecules,":[9],"which":[10],"used":[13],"to":[14,52,97,124,189,204],"place":[15],"the":[16,19,35,38,119,134,143,187,191],"molecules":[17],"within":[18],"context":[20],"a":[22,46,122,131,210,234],"broader":[23],"\"chemical":[24],"space.\"":[25],"These":[26],"definitions":[27,58,110],"vary":[28],"based":[29,181],"on":[30,182],"compounds":[31,62],"interest":[33],"and":[34,66,91,215,233],"goals":[36],"given":[39],"space":[41,57,102,239],"definition.":[42],"Here,":[43],"we":[44,105],"introduce":[45],"customizable":[47],"Python":[48],"module,":[49],"<i>chespa</i>,":[50],"built":[51],"easily":[53],"assess":[54],"different":[55,100],"through":[59],"clustering":[60],"in":[63,95,169,207,218],"these":[64,70,108],"spaces":[65],"visualizing":[67],"trends":[68],"clusters.":[71],"To":[72],"demonstrate":[73],"this,":[74],"<i>chespa</i>":[75],"currently":[76],"streamlines":[77],"prediction":[78,228],"various":[80],"molecular":[81,86],"descriptors":[82],"(predicted":[83],"properties,":[85],"substructures,":[87],"AI-based":[88],"space,":[90],"class":[93],"ontology)":[94],"order":[96],"test":[98],"six":[99],"definitions.":[103],"Furthermore,":[104],"investigated":[106],"how":[107],"varying":[109],"trend":[111],"with":[112,127],"mass":[113],"spectrometry":[114],"(MS)-based":[115],"observability,":[116],"that":[117],"is,":[118],"ability":[120,188],"molecule":[123,135],"observed":[126],"MS":[128],"(e.g.,":[129],"as":[130,173],"function":[132],"ionizability),":[136],"using":[137],"an":[138],"example":[139],"data":[140,159],"set":[141],"from":[142],"U.S.":[144],"EPA's":[145],"nontargeted":[146],"analysis":[147],"collaborative":[148],"trial,":[149],"where":[150],"blinded":[151],"samples":[152],"had":[153],"been":[154],"analyzed":[155],"previously,":[156],"providing":[157],"1398":[158],"points.":[160],"Improved":[161],"understanding":[162],"observability":[164,222],"would":[165],"offer":[166],"many":[167],"advantages":[168],"small-molecule":[170],"identification,":[171],"such":[172],"(i)":[174],"<i>a":[175],"priori</i>":[176],"selection":[177],"experimental":[179],"conditions":[180],"suspected":[183],"sample":[184],"composition,":[185],"(ii)":[186],"reduce":[190],"number":[192],"candidate":[194,236],"structures":[195],"during":[196],"compound":[197],"identification":[198],"by":[199],"removing":[200],"those":[201],"less":[202],"likely":[203],"ionize,":[205],"and,":[206],"turn,":[208],"(iii)":[209],"reduced":[211],"false":[212],"discovery":[213],"rate":[214],"increased":[216],"confidence":[217],"identifications.":[219],"Factors":[220],"controlling":[221],"are":[223],"not":[224],"fully":[225],"understood,":[226],"making":[227],"this":[230],"property":[231],"nontrivial":[232],"prime":[235],"analysis.":[240],"<i>Chespa</i>":[241],"is":[242],"available":[243],"at":[244],"github.com/pnnl/chespa.":[245]},"counts_by_year":[{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
