{"id":"https://openalex.org/W4409246334","doi":"https://doi.org/10.1021/acs.jcim.4c01982","title":"DirectMultiStep: Direct Route Generation for Multistep Retrosynthesis","display_name":"DirectMultiStep: Direct Route Generation for Multistep Retrosynthesis","publication_year":2025,"publication_date":"2025-04-08","ids":{"openalex":"https://openalex.org/W4409246334","doi":"https://doi.org/10.1021/acs.jcim.4c01982","pmid":"https://pubmed.ncbi.nlm.nih.gov/40197023"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.4c01982","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.4c01982","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032771309","display_name":"Yu Shee","orcid":"https://orcid.org/0000-0002-3728-0021"},"institutions":[{"id":"https://openalex.org/I32971472","display_name":"Yale University","ror":"https://ror.org/03v76x132","country_code":"US","type":"education","lineage":["https://openalex.org/I32971472"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yu Shee","raw_affiliation_strings":["Department of Chemistry, Yale University, P.O. Box 208107, New Haven, Connecticut 06520-8107, United States"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry, Yale University, P.O. Box 208107, New Haven, Connecticut 06520-8107, United States","institution_ids":["https://openalex.org/I32971472"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075906555","display_name":"Anton Morgunov","orcid":"https://orcid.org/0009-0004-6245-0354"},"institutions":[{"id":"https://openalex.org/I32971472","display_name":"Yale University","ror":"https://ror.org/03v76x132","country_code":"US","type":"education","lineage":["https://openalex.org/I32971472"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anton Morgunov","raw_affiliation_strings":["Department of Chemistry, Yale University, P.O. Box 208107, New Haven, Connecticut 06520-8107, United States"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry, Yale University, P.O. Box 208107, New Haven, Connecticut 06520-8107, United States","institution_ids":["https://openalex.org/I32971472"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071542127","display_name":"Haote Li","orcid":"https://orcid.org/0000-0002-8146-5066"},"institutions":[{"id":"https://openalex.org/I32971472","display_name":"Yale University","ror":"https://ror.org/03v76x132","country_code":"US","type":"education","lineage":["https://openalex.org/I32971472"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Haote Li","raw_affiliation_strings":["Department of Chemistry, Yale University, P.O. Box 208107, New Haven, Connecticut 06520-8107, United States"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry, Yale University, P.O. Box 208107, New Haven, Connecticut 06520-8107, United States","institution_ids":["https://openalex.org/I32971472"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089129603","display_name":"V\u00edctor S. Batista","orcid":"https://orcid.org/0000-0002-3262-1237"},"institutions":[{"id":"https://openalex.org/I32971472","display_name":"Yale University","ror":"https://ror.org/03v76x132","country_code":"US","type":"education","lineage":["https://openalex.org/I32971472"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Victor S. Batista","raw_affiliation_strings":["Department of Chemistry, Yale University, P.O. Box 208107, New Haven, Connecticut 06520-8107, United States"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry, Yale University, P.O. Box 208107, New Haven, Connecticut 06520-8107, United States","institution_ids":["https://openalex.org/I32971472"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5089129603"],"corresponding_institution_ids":["https://openalex.org/I32971472"],"apc_list":null,"apc_paid":null,"fwci":7.0342,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.97128136,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"65","issue":"8","first_page":"3903","last_page":"3914"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11970","display_name":"Molecular Biology Techniques and Applications","score":0.9484999775886536,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.9375,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/retrosynthetic-analysis","display_name":"Retrosynthetic analysis","score":0.8713051080703735},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4039555490016937},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.22479447722434998},{"id":"https://openalex.org/keywords/stereochemistry","display_name":"Stereochemistry","score":0.11814302206039429}],"concepts":[{"id":"https://openalex.org/C42437451","wikidata":"https://www.wikidata.org/wiki/Q902227","display_name":"Retrosynthetic analysis","level":3,"score":0.8713051080703735},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4039555490016937},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.22479447722434998},{"id":"https://openalex.org/C71240020","wikidata":"https://www.wikidata.org/wiki/Q186011","display_name":"Stereochemistry","level":1,"score":0.11814302206039429},{"id":"https://openalex.org/C35753019","wikidata":"https://www.wikidata.org/wiki/Q644785","display_name":"Total synthesis","level":2,"score":0.0}],"mesh":[{"descriptor_ui":"D060326","descriptor_name":"Chemistry Techniques, Synthetic","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D060326","descriptor_name":"Chemistry Techniques, Synthetic","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D060326","descriptor_name":"Chemistry Techniques, Synthetic","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1021/acs.jcim.4c01982","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.4c01982","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:40197023","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40197023","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5509767062","display_name":null,"funder_award_id":"2124511","funder_id":"https://openalex.org/F4320337393","funder_display_name":"Division of Chemistry"}],"funders":[{"id":"https://openalex.org/F4320337393","display_name":"Division of Chemistry","ror":"https://ror.org/01ar8dr59"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":53,"referenced_works":["https://openalex.org/W1997974358","https://openalex.org/W2042022967","https://openalex.org/W2064000318","https://openalex.org/W2580919858","https://openalex.org/W2607112153","https://openalex.org/W2621742623","https://openalex.org/W2747592475","https://openalex.org/W2769756736","https://openalex.org/W2899663614","https://openalex.org/W2908510526","https://openalex.org/W2964121744","https://openalex.org/W2969507301","https://openalex.org/W2970764640","https://openalex.org/W2981452123","https://openalex.org/W2987091515","https://openalex.org/W2991279511","https://openalex.org/W2994678679","https://openalex.org/W2998367408","https://openalex.org/W3009202547","https://openalex.org/W3009579421","https://openalex.org/W3010145447","https://openalex.org/W3013312987","https://openalex.org/W3014689923","https://openalex.org/W3036578548","https://openalex.org/W3087968351","https://openalex.org/W3088265803","https://openalex.org/W3094771832","https://openalex.org/W3119022334","https://openalex.org/W3120024000","https://openalex.org/W3125919803","https://openalex.org/W3152975457","https://openalex.org/W3169208069","https://openalex.org/W3174318304","https://openalex.org/W3175633940","https://openalex.org/W3181403764","https://openalex.org/W3189262114","https://openalex.org/W3189809547","https://openalex.org/W3201624628","https://openalex.org/W3205082678","https://openalex.org/W4205455490","https://openalex.org/W4220670676","https://openalex.org/W4226159083","https://openalex.org/W4229040393","https://openalex.org/W4283449818","https://openalex.org/W4285193863","https://openalex.org/W4288371066","https://openalex.org/W4293718192","https://openalex.org/W4378219995","https://openalex.org/W4387297831","https://openalex.org/W4390236774","https://openalex.org/W4390723197","https://openalex.org/W4402354716","https://openalex.org/W4407164079"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W1443743067","https://openalex.org/W4385784498","https://openalex.org/W4385842036","https://openalex.org/W4288371066","https://openalex.org/W4285670373","https://openalex.org/W2910734083","https://openalex.org/W3101473090"],"abstract_inverted_index":{"Traditional":[0],"computer-aided":[1],"synthesis":[2],"planning":[3],"(CASP)":[4],"methods":[5,69],"rely":[6],"on":[7,51,70,82,134,176],"iterative":[8],"single-step":[9],"predictions,":[10],"leading":[11],"to":[12,36],"exponential":[13],"search":[14],"space":[15],"growth":[16],"that":[17,29],"limits":[18],"efficiency":[19],"and":[20,76,85,100,110,136,142],"scalability.":[21],"We":[22],"introduce":[23],"a":[24,31,43,105,185],"series":[25],"of":[26,33,98,118,169],"transformer-based":[27],"models":[28,147],"leverage":[30],"mixture":[32],"experts":[34],"approach":[35,183],"directly":[37],"generate":[38],"multistep":[39],"synthetic":[40],"routes":[41,150],"as":[42,65,94],"single":[44],"string,":[45],"conditionally":[46],"predicting":[47],"each":[48],"transformation":[49],"based":[50],"all":[52],"preceding":[53],"ones.":[54],"Our":[55],"DMS":[56],"Explorer":[57],"XL":[58],"model,":[59],"which":[60],"requires":[61],"only":[62],"target":[63],"compounds":[64],"input,":[66],"outperforms":[67],"state-of-the-art":[68],"the":[71,83,95,116,123,152,158,166,170],"PaRoutes":[72],"dataset":[73],"with":[74],"1.9x":[75],"3.1x":[77],"improvements":[78],"in":[79,107,113,157],"Top-1":[80,135],"accuracy":[81],"n<sub>1</sub>":[84,141],"n<sub>5</sub>":[86,143],"test":[87],"sets,":[88],"respectively.":[89],"Providing":[90],"additional":[91],"information,":[92],"such":[93],"desired":[96],"number":[97],"steps":[99],"starting":[101],"materials,":[102],"enables":[103],"both":[104,140],"reduction":[106],"model":[108,130],"size":[109],"an":[111],"increase":[112],"accuracy,":[114],"highlighting":[115],"benefits":[117],"incorporating":[119],"more":[120],"constraints":[121],"into":[122],"prediction":[124],"process.":[125],"The":[126],"top-performing":[127],"DMS-Flex":[128],"(Duo)":[129],"scores":[131],"25-50%":[132],"higher":[133],"Top-10":[137],"accuracies":[138],"for":[139,151],"sets.":[144],"Additionally,":[145],"our":[146,181],"successfully":[148],"predict":[149],"FDA-approved":[153],"drugs":[154],"not":[155],"included":[156],"training":[159,171],"data,":[160],"demonstrating":[161],"strong":[162],"generalization":[163],"capabilities.":[164],"While":[165],"limited":[167],"diversity":[168],"set":[172],"may":[173],"affect":[174],"performance":[175],"less":[177],"common":[178],"reaction":[179],"types,":[180],"multistep-first":[182],"presents":[184],"promising":[186],"direction":[187],"toward":[188],"fully":[189],"automated":[190],"retrosynthetic":[191],"planning.":[192]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":4}],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
