{"id":"https://openalex.org/W3006394635","doi":"https://doi.org/10.1021/acs.jcim.9b01080","title":"Toward a Comprehensive Treatment of Tautomerism in Chemoinformatics Including in InChI V2","display_name":"Toward a Comprehensive Treatment of Tautomerism in Chemoinformatics Including in InChI V2","publication_year":2020,"publication_date":"2020-02-11","ids":{"openalex":"https://openalex.org/W3006394635","doi":"https://doi.org/10.1021/acs.jcim.9b01080","mag":"3006394635","pmid":"https://pubmed.ncbi.nlm.nih.gov/32043883"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.9b01080","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.9b01080","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/8459712","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065243838","display_name":"Devendra K. Dhaked","orcid":"https://orcid.org/0000-0001-6349-7649"},"institutions":[{"id":"https://openalex.org/I4210130649","display_name":"Frederick National Laboratory for Cancer Research","ror":"https://ror.org/03v6m3209","country_code":"US","type":"facility","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210130649","https://openalex.org/I4210140884"]},{"id":"https://openalex.org/I4210140884","display_name":"National Cancer Institute","ror":"https://ror.org/040gcmg81","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210140884"]},{"id":"https://openalex.org/I4210149717","display_name":"Center for Cancer Research","ror":"https://ror.org/05bjen692","country_code":"US","type":"facility","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210140884","https://openalex.org/I4210149717"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Devendra K. Dhaked","raw_affiliation_strings":["Computer-Aided Drug Design Group, Chemical Biology Laboratory, Center for Cancer Research, National Cancer Institute, NIH, Frederick, Maryland 21702, United States"],"raw_orcid":"https://orcid.org/0000-0001-6349-7649","affiliations":[{"raw_affiliation_string":"Computer-Aided Drug Design Group, Chemical Biology Laboratory, Center for Cancer Research, National Cancer Institute, NIH, Frederick, Maryland 21702, United States","institution_ids":["https://openalex.org/I4210130649","https://openalex.org/I4210140884","https://openalex.org/I4210149717"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024670976","display_name":"Wolf D. Ihlenfeldt","orcid":"https://orcid.org/0000-0002-1973-1271"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wolf-Dietrich Ihlenfeldt","raw_affiliation_strings":["Xemistry GmbH, Hainholzweg 11, D-61479 Glash\u00fctten, Germany"],"raw_orcid":"https://orcid.org/0000-0002-1973-1271","affiliations":[{"raw_affiliation_string":"Xemistry GmbH, Hainholzweg 11, D-61479 Glash\u00fctten, Germany","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027458236","display_name":"Hitesh Patel","orcid":"https://orcid.org/0000-0003-3329-0377"},"institutions":[{"id":"https://openalex.org/I4210130649","display_name":"Frederick National Laboratory for Cancer Research","ror":"https://ror.org/03v6m3209","country_code":"US","type":"facility","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210130649","https://openalex.org/I4210140884"]},{"id":"https://openalex.org/I4210140884","display_name":"National Cancer Institute","ror":"https://ror.org/040gcmg81","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210140884"]},{"id":"https://openalex.org/I4210149717","display_name":"Center for Cancer Research","ror":"https://ror.org/05bjen692","country_code":"US","type":"facility","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210140884","https://openalex.org/I4210149717"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hitesh Patel","raw_affiliation_strings":["Computer-Aided Drug Design Group, Chemical Biology Laboratory, Center for Cancer Research, National Cancer Institute, NIH, Frederick, Maryland 21702, United States"],"raw_orcid":"https://orcid.org/0000-0003-3329-0377","affiliations":[{"raw_affiliation_string":"Computer-Aided Drug Design Group, Chemical Biology Laboratory, Center for Cancer Research, National Cancer Institute, NIH, Frederick, Maryland 21702, United States","institution_ids":["https://openalex.org/I4210130649","https://openalex.org/I4210140884","https://openalex.org/I4210149717"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057371213","display_name":"Victorien Delann\u00e9e","orcid":"https://orcid.org/0000-0002-5776-0129"},"institutions":[{"id":"https://openalex.org/I4210130649","display_name":"Frederick National Laboratory for Cancer Research","ror":"https://ror.org/03v6m3209","country_code":"US","type":"facility","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210130649","https://openalex.org/I4210140884"]},{"id":"https://openalex.org/I4210140884","display_name":"National Cancer Institute","ror":"https://ror.org/040gcmg81","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210140884"]},{"id":"https://openalex.org/I4210149717","display_name":"Center for Cancer Research","ror":"https://ror.org/05bjen692","country_code":"US","type":"facility","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210140884","https://openalex.org/I4210149717"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Victorien Delann\u00e9e","raw_affiliation_strings":["Computer-Aided Drug Design Group, Chemical Biology Laboratory, Center for Cancer Research, National Cancer Institute, NIH, Frederick, Maryland 21702, United States"],"raw_orcid":"https://orcid.org/0000-0002-5776-0129","affiliations":[{"raw_affiliation_string":"Computer-Aided Drug Design Group, Chemical Biology Laboratory, Center for Cancer Research, National Cancer Institute, NIH, Frederick, Maryland 21702, United States","institution_ids":["https://openalex.org/I4210130649","https://openalex.org/I4210140884","https://openalex.org/I4210149717"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078864876","display_name":"Marc C. Nicklaus","orcid":"https://orcid.org/0000-0002-4775-7030"},"institutions":[{"id":"https://openalex.org/I4210130649","display_name":"Frederick National Laboratory for Cancer Research","ror":"https://ror.org/03v6m3209","country_code":"US","type":"facility","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210130649","https://openalex.org/I4210140884"]},{"id":"https://openalex.org/I4210140884","display_name":"National Cancer Institute","ror":"https://ror.org/040gcmg81","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210140884"]},{"id":"https://openalex.org/I4210149717","display_name":"Center for Cancer Research","ror":"https://ror.org/05bjen692","country_code":"US","type":"facility","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210140884","https://openalex.org/I4210149717"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Marc C. Nicklaus","raw_affiliation_strings":["Computer-Aided Drug Design Group, Chemical Biology Laboratory, Center for Cancer Research, National Cancer Institute, NIH, Frederick, Maryland 21702, United States"],"raw_orcid":"https://orcid.org/0000-0002-4775-7030","affiliations":[{"raw_affiliation_string":"Computer-Aided Drug Design Group, Chemical Biology Laboratory, Center for Cancer Research, National Cancer Institute, NIH, Frederick, Maryland 21702, United States","institution_ids":["https://openalex.org/I4210130649","https://openalex.org/I4210140884","https://openalex.org/I4210149717"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5078864876"],"corresponding_institution_ids":["https://openalex.org/I4210130649","https://openalex.org/I4210140884","https://openalex.org/I4210149717"],"apc_list":null,"apc_paid":null,"fwci":3.6129,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.94169464,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"60","issue":"3","first_page":"1253","last_page":"1275"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11407","display_name":"Innovative Microfluidic and Catalytic Techniques Innovation","score":0.9855999946594238,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cheminformatics","display_name":"Cheminformatics","score":0.9208158254623413},{"id":"https://openalex.org/keywords/tautomer","display_name":"Tautomer","score":0.7999536395072937},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.48093289136886597},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3958008587360382},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.34878072142601013},{"id":"https://openalex.org/keywords/computational-chemistry","display_name":"Computational chemistry","score":0.31635773181915283},{"id":"https://openalex.org/keywords/medicinal-chemistry","display_name":"Medicinal chemistry","score":0.19573789834976196},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.14745372533798218}],"concepts":[{"id":"https://openalex.org/C68762167","wikidata":"https://www.wikidata.org/wiki/Q910164","display_name":"Cheminformatics","level":2,"score":0.9208158254623413},{"id":"https://openalex.org/C111233374","wikidata":"https://www.wikidata.org/wiki/Q334640","display_name":"Tautomer","level":2,"score":0.7999536395072937},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.48093289136886597},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3958008587360382},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.34878072142601013},{"id":"https://openalex.org/C147597530","wikidata":"https://www.wikidata.org/wiki/Q369472","display_name":"Computational chemistry","level":1,"score":0.31635773181915283},{"id":"https://openalex.org/C155647269","wikidata":"https://www.wikidata.org/wiki/Q243455","display_name":"Medicinal chemistry","level":1,"score":0.19573789834976196},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.14745372533798218}],"mesh":[{"descriptor_ui":"D000080911","descriptor_name":"Cheminformatics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000080911","descriptor_name":"Cheminformatics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000080911","descriptor_name":"Cheminformatics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000080911","descriptor_name":"Cheminformatics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":4,"locations":[{"id":"doi:10.1021/acs.jcim.9b01080","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.9b01080","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:32043883","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/32043883","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null},{"id":"pmh:oai:europepmc.org:7349494","is_oa":false,"landing_page_url":"http://europepmc.org/pmc/articles/PMC8459712","pdf_url":null,"source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"},{"id":"pmh:oai:pubmedcentral.nih.gov:8459712","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/8459712","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Chem Inf Model","raw_type":"Text"}],"best_oa_location":{"id":"pmh:oai:pubmedcentral.nih.gov:8459712","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/8459712","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Chem Inf Model","raw_type":"Text"},"sustainable_development_goals":[{"score":0.4300000071525574,"id":"https://metadata.un.org/sdg/17","display_name":"Partnerships for the goals"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320337351","display_name":"National Cancer Institute","ror":"https://ror.org/040gcmg81"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W192194939","https://openalex.org/W1508604947","https://openalex.org/W1545406574","https://openalex.org/W1975147762","https://openalex.org/W1983283443","https://openalex.org/W2012961504","https://openalex.org/W2016455326","https://openalex.org/W2045873232","https://openalex.org/W2050226017","https://openalex.org/W2083836648","https://openalex.org/W2087563523","https://openalex.org/W2097186436","https://openalex.org/W2177317049","https://openalex.org/W2523800160","https://openalex.org/W2541404351","https://openalex.org/W2558999090","https://openalex.org/W2767891136","https://openalex.org/W3002554271","https://openalex.org/W3004704740","https://openalex.org/W4229513077"],"related_works":["https://openalex.org/W4297103231","https://openalex.org/W2006553579","https://openalex.org/W2070940942","https://openalex.org/W2015887350","https://openalex.org/W2106027604","https://openalex.org/W2361129091","https://openalex.org/W2082158222","https://openalex.org/W4323359560","https://openalex.org/W2884165437","https://openalex.org/W2744233384"],"abstract_inverted_index":{"We":[0],"have":[1,32],"collected":[2],"86":[3],"different":[4],"transforms":[5],"of":[6,10,29,45,57,89,121,129,138,140,159],"tautomeric":[7,170],"interconversions.":[8],"Out":[9],"those,":[11],"54":[12],"are":[13,124],"for":[14,19,24,142],"prototropic":[15],"(non-ring-chain)":[16],"tautomerism,":[17,21,50],"21":[18],"ring-chain":[20],"and":[22,87,102,112,118],"11":[23],"valence":[25],"tautomerism.":[26],"The":[27,64],"majority":[28],"these":[30,183],"rules":[31,65,149,184],"been":[33,179],"extracted":[34],"from":[35,53],"experimental":[36],"literature.":[37],"Twenty":[38],"rules,":[39],"covering":[40],"the":[41,54,60,90,107,119,127,130,136,148,157],"most":[42],"well-known":[43],"types":[44],"tautomerism":[46,58,141],"such":[47],"as":[48,78],"keto-enol":[49],"were":[51,66],"taken":[52],"default":[55],"handling":[56,139],"by":[59,95,169,172],"chemoinformatics":[61],"toolkit":[62],"CACTVS.":[63],"analyzed":[67],"against":[68],"nine":[69],"differerent":[70],"databases":[71,164],"totaling":[72],"over":[73],"400":[74],"million":[75],"(non-unique)":[76],"structures":[77],"to":[79,181],"their":[80],"occurrence":[81],"rates,":[82],"mutual":[83],"overlap":[84],"in":[85,99,126,151,161],"coverage,":[86],"recapitulation":[88],"rules'":[91],"enumerated":[92],"tautomer":[93],"sets":[94],"InChI":[96,132,144,173],"V.1.05,":[97],"both":[98],"InChI's":[100],"Standard":[101],"a":[103],"Nonstandard":[104],"version":[105,145],"with":[106,135],"increased":[108],"tautomer-handling":[109],"options":[110],"15T":[111],"KET":[113],"turned":[114],"on.":[115],"These":[116],"results":[117],"background":[120],"this":[122,152],"study":[123],"discussed":[125],"context":[128],"IUPAC":[131],"Project":[133],"tasked":[134],"redesign":[137],"an":[143],"2.":[146],"Applying":[147],"presented":[150],"paper":[153],"would":[154,166],"approximately":[155],"triple":[156],"number":[158],"compounds":[160],"typical":[162],"small-molecule":[163],"that":[165],"be":[167],"affected":[168],"interconversion":[171],"V2.":[174],"A":[175],"web":[176],"tool":[177],"has":[178],"created":[180],"test":[182],"at":[185],"https://cactus.nci.nih.gov/tautomerizer.":[186]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
