{"id":"https://openalex.org/W4408925102","doi":"https://doi.org/10.1021/acs.jcim.5c00167","title":"Prediction of Chromatographic Retention Time of a Small Molecule from SMILES Representation Using a Hybrid Transformer-LSTM Model","display_name":"Prediction of Chromatographic Retention Time of a Small Molecule from SMILES Representation Using a Hybrid Transformer-LSTM Model","publication_year":2025,"publication_date":"2025-03-28","ids":{"openalex":"https://openalex.org/W4408925102","doi":"https://doi.org/10.1021/acs.jcim.5c00167","pmid":"https://pubmed.ncbi.nlm.nih.gov/40152775"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.5c00167","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.5c00167","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027300762","display_name":"Sargol Mazraedoost","orcid":"https://orcid.org/0000-0001-6656-1968"},"institutions":[{"id":"https://openalex.org/I8991828","display_name":"Pukyong National University","ror":"https://ror.org/0433kqc49","country_code":"KR","type":"education","lineage":["https://openalex.org/I8991828"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Sargol Mazraedoost","raw_affiliation_strings":["Department of Chemical Engineering","Pukyong National University","Department of Chemical Engineering, Pukyong National University, Busan 48513, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Department of Chemical Engineering","institution_ids":[]},{"raw_affiliation_string":"Pukyong National University","institution_ids":["https://openalex.org/I8991828"]},{"raw_affiliation_string":"Department of Chemical Engineering, Pukyong National University, Busan 48513, Republic of Korea","institution_ids":["https://openalex.org/I8991828"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5094210709","display_name":"Hadi Sedigh Malekroodi","orcid":"https://orcid.org/0009-0001-1958-1525"},"institutions":[{"id":"https://openalex.org/I1297592001","display_name":"Bionics Institute","ror":"https://ror.org/05e4f1b55","country_code":"AU","type":"facility","lineage":["https://openalex.org/I1297592001"]},{"id":"https://openalex.org/I4210147194","display_name":"Convergence","ror":"https://ror.org/03kcznq08","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210147194"]},{"id":"https://openalex.org/I8991828","display_name":"Pukyong National University","ror":"https://ror.org/0433kqc49","country_code":"KR","type":"education","lineage":["https://openalex.org/I8991828"]}],"countries":["AU","KR","US"],"is_corresponding":false,"raw_author_name":"Hadi Sedigh Malekroodi","raw_affiliation_strings":["Industry 4.0 Convergence Bionics Engineering","Pukyong National University","Industry 4.0 Convergence Bionics Engineering, Pukyong National University, Busan 48513, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Industry 4.0 Convergence Bionics Engineering","institution_ids":["https://openalex.org/I1297592001","https://openalex.org/I4210147194"]},{"raw_affiliation_string":"Pukyong National University","institution_ids":["https://openalex.org/I8991828"]},{"raw_affiliation_string":"Industry 4.0 Convergence Bionics Engineering, Pukyong National University, Busan 48513, Republic of Korea","institution_ids":["https://openalex.org/I8991828"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002854147","display_name":"Petar \u017duvela","orcid":"https://orcid.org/0000-0001-6481-2241"},"institutions":[{"id":"https://openalex.org/I8991828","display_name":"Pukyong National University","ror":"https://ror.org/0433kqc49","country_code":"KR","type":"education","lineage":["https://openalex.org/I8991828"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Petar \u017duvela","raw_affiliation_strings":["Department of Chemical Engineering","Pukyong National University","Department of Chemical Engineering, Pukyong National University, Busan 48513, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Department of Chemical Engineering","institution_ids":[]},{"raw_affiliation_string":"Pukyong National University","institution_ids":["https://openalex.org/I8991828"]},{"raw_affiliation_string":"Department of Chemical Engineering, Pukyong National University, Busan 48513, Republic of Korea","institution_ids":["https://openalex.org/I8991828"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010623403","display_name":"Myunggi Yi","orcid":"https://orcid.org/0000-0003-4864-959X"},"institutions":[{"id":"https://openalex.org/I1297592001","display_name":"Bionics Institute","ror":"https://ror.org/05e4f1b55","country_code":"AU","type":"facility","lineage":["https://openalex.org/I1297592001"]},{"id":"https://openalex.org/I4210147194","display_name":"Convergence","ror":"https://ror.org/03kcznq08","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210147194"]},{"id":"https://openalex.org/I8991828","display_name":"Pukyong National University","ror":"https://ror.org/0433kqc49","country_code":"KR","type":"education","lineage":["https://openalex.org/I8991828"]}],"countries":["AU","KR","US"],"is_corresponding":false,"raw_author_name":"Myunggi Yi","raw_affiliation_strings":["Industry 4.0 Convergence Bionics Engineering","Major of Biomedical Engineering, Division of Smart Healthcare","Pukyong National University","Industry 4.0 Convergence Bionics Engineering, Pukyong National University, Busan 48513, Republic of Korea","Major of Biomedical Engineering, Division of Smart Healthcare, Pukyong National University, Busan 48513, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Industry 4.0 Convergence Bionics Engineering","institution_ids":["https://openalex.org/I1297592001","https://openalex.org/I4210147194"]},{"raw_affiliation_string":"Major of Biomedical Engineering, Division of Smart Healthcare","institution_ids":[]},{"raw_affiliation_string":"Pukyong National University","institution_ids":["https://openalex.org/I8991828"]},{"raw_affiliation_string":"Industry 4.0 Convergence Bionics Engineering, Pukyong National University, Busan 48513, Republic of Korea","institution_ids":["https://openalex.org/I8991828"]},{"raw_affiliation_string":"Major of Biomedical Engineering, Division of Smart Healthcare, Pukyong National University, Busan 48513, Republic of Korea","institution_ids":["https://openalex.org/I8991828"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5004823439","display_name":"Jay Liu","orcid":"https://orcid.org/0000-0003-4274-2355"},"institutions":[{"id":"https://openalex.org/I8991828","display_name":"Pukyong National University","ror":"https://ror.org/0433kqc49","country_code":"KR","type":"education","lineage":["https://openalex.org/I8991828"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"J. Jay Liu","raw_affiliation_strings":["Department of Chemical Engineering","Institute of Cleaner Production Technology Pukyong National University, 45, Yongso-Ro, Nam-Gu, Busan 48513, South Korea","Pukyong National University","Department of Chemical Engineering, Pukyong National University, Busan 48513, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Department of Chemical Engineering","institution_ids":[]},{"raw_affiliation_string":"Institute of Cleaner Production Technology Pukyong National University, 45, Yongso-Ro, Nam-Gu, Busan 48513, South Korea","institution_ids":["https://openalex.org/I8991828"]},{"raw_affiliation_string":"Pukyong National University","institution_ids":["https://openalex.org/I8991828"]},{"raw_affiliation_string":"Department of Chemical Engineering, Pukyong National University, Busan 48513, Republic of Korea","institution_ids":["https://openalex.org/I8991828"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5004823439"],"corresponding_institution_ids":["https://openalex.org/I8991828"],"apc_list":null,"apc_paid":null,"fwci":10.6514,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.98258643,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"65","issue":"7","first_page":"3343","last_page":"3356"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10908","display_name":"Analytical Chemistry and Chromatography","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11124","display_name":"Protein purification and stability","score":0.9799000024795532,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/retention-time","display_name":"Retention time","score":0.7039846181869507},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6628405451774597},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.517932116985321},{"id":"https://openalex.org/keywords/chromatography","display_name":"Chromatography","score":0.46177542209625244},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.45258814096450806},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3533933460712433},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.32222601771354675},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11234128475189209},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.07123681902885437},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.06184345483779907}],"concepts":[{"id":"https://openalex.org/C3020018676","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Retention time","level":2,"score":0.7039846181869507},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6628405451774597},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.517932116985321},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.46177542209625244},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.45258814096450806},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3533933460712433},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.32222601771354675},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11234128475189209},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.07123681902885437},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.06184345483779907},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[{"descriptor_ui":"D002851","descriptor_name":"Chromatography, High Pressure Liquid","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D002851","descriptor_name":"Chromatography, High Pressure Liquid","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013997","descriptor_name":"Time Factors","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013997","descriptor_name":"Time Factors","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D054852","descriptor_name":"Small Molecule Libraries","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D054852","descriptor_name":"Small Molecule Libraries","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D056148","descriptor_name":"Chromatography, Reverse-Phase","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D056148","descriptor_name":"Chromatography, Reverse-Phase","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1021/acs.jcim.5c00167","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.5c00167","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:40152775","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40152775","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2384748037","display_name":null,"funder_award_id":"RS-2024-00337129","funder_id":"https://openalex.org/F4320328359","funder_display_name":"Ministry of Science and ICT, South Korea"}],"funders":[{"id":"https://openalex.org/F4320328359","display_name":"Ministry of Science and ICT, South Korea","ror":"https://ror.org/01wpjm123"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W129305155","https://openalex.org/W1557141846","https://openalex.org/W1983478747","https://openalex.org/W1988037271","https://openalex.org/W2032559740","https://openalex.org/W2049133822","https://openalex.org/W2064675550","https://openalex.org/W2087563523","https://openalex.org/W2265106087","https://openalex.org/W2408969840","https://openalex.org/W2594183968","https://openalex.org/W2892186999","https://openalex.org/W2896457183","https://openalex.org/W2908336004","https://openalex.org/W2908510526","https://openalex.org/W2914609306","https://openalex.org/W2919115771","https://openalex.org/W2965373594","https://openalex.org/W2972498877","https://openalex.org/W2996714860","https://openalex.org/W3023204497","https://openalex.org/W3080359515","https://openalex.org/W3093934881","https://openalex.org/W3094450043","https://openalex.org/W3118642024","https://openalex.org/W3128640640","https://openalex.org/W3212001303","https://openalex.org/W3214385661","https://openalex.org/W4200240219","https://openalex.org/W4200573776","https://openalex.org/W4206313288","https://openalex.org/W4213070269","https://openalex.org/W4244050815","https://openalex.org/W4281778378","https://openalex.org/W4293543509","https://openalex.org/W4297179162","https://openalex.org/W4297988964","https://openalex.org/W4303982455","https://openalex.org/W4304809666","https://openalex.org/W4387614160","https://openalex.org/W4388626524","https://openalex.org/W4392143551","https://openalex.org/W4393005262","https://openalex.org/W4402570700","https://openalex.org/W4405185373"],"related_works":["https://openalex.org/W1534271895","https://openalex.org/W2051024374","https://openalex.org/W2321445466","https://openalex.org/W1978919776","https://openalex.org/W2079759535","https://openalex.org/W3165403372","https://openalex.org/W2031052898","https://openalex.org/W2139969667","https://openalex.org/W2058645934","https://openalex.org/W2032480086"],"abstract_inverted_index":{"Accurate":[0],"retention":[1,77,89],"time":[2,90],"(RT)":[3],"prediction":[4],"in":[5,12,51,79,224,230],"liquid":[6,82,225],"chromatography":[7,83],"remains":[8],"a":[9,23,57,64,108,140,148,218],"significant":[10],"consideration":[11],"molecular":[13,33,112,175],"analysis.":[14,235],"In":[15],"this":[16,52],"study,":[17],"we":[18,182],"explore":[19],"the":[20,184,194,214],"use":[21],"of":[22,66,145,154,160],"transformer-based":[24],"language":[25],"model":[26,216],"to":[27,75,110,136],"predict":[28,76],"RTs":[29],"by":[30],"treating":[31],"simplified":[32],"input":[34],"line":[35],"entry":[36],"system":[37],"(SMILES)":[38],"sequences":[39],"as":[40,114],"textual":[41],"input,":[42],"an":[43],"approach":[44,220],"that":[45,177,213],"has":[46],"not":[47],"been":[48],"previously":[49],"utilized":[50],"field.":[53],"Our":[54,210],"architecture":[55,120],"combines":[56],"pretrained":[58],"RoBERTa":[59],"(robustly":[60],"optimized":[61],"BERT":[62],"approach,":[63],"variant":[65],"BERT)":[67],"with":[68,139,204,227],"bidirectional":[69,129],"long":[70],"short-term":[71],"memory":[72],"(BiLSTM)":[73],"networks":[74],"times":[78],"reversed-phase":[80],"high-performance":[81],"(RP-HPLC).":[84],"The":[85,117,162],"METLIN":[86],"small":[87,96,233],"molecule":[88,234],"(SMRT)":[91],"data":[92,191],"set":[93],"comprising":[94],"77,980":[95],"molecules":[97],"after":[98],"preprocessing,":[99],"was":[100,165],"encoded":[101],"using":[102],"SMILES":[103],"notation":[104],"and":[105,128,156,232],"processed":[106],"through":[107,167],"tokenizer":[109],"enable":[111],"representation":[113],"sequential":[115],"data.":[116],"proposed":[118],"transformer-LSTM":[119],"incorporates":[121],"layer":[122],"fusion":[123],"from":[124,193],"multiple":[125],"transformer":[126],"layers":[127],"sequence":[130],"processing,":[131],"achieving":[132],"superior":[133],"performance":[134,199],"compared":[135],"existing":[137],"methods":[138],"mean":[141,149],"absolute":[142,150],"error":[143,152],"(MAE)":[144],"26.23":[146],"s,":[147],"percentage":[151],"(MAPE)":[153],"3.25%,":[155],"<i>R</i>-squared":[157],"(<i>R</i><sup>2</sup>)":[158],"value":[159],"0.91.":[161],"model's":[163,185],"explainability":[164],"demonstrated":[166],"attention":[168],"visualization,":[169],"revealing":[170],"its":[171],"focus":[172],"on":[173],"key":[174],"features":[176],"can":[178],"influence":[179],"RT.":[180],"Furthermore,":[181],"evaluated":[183],"transfer":[186],"learning":[187],"capabilities":[188],"across":[189,200],"ten":[190],"sets":[192],"PredRet":[195],"database,":[196],"demonstrating":[197],"robust":[198],"different":[201],"chromatographic":[202],"conditions":[203],"consistent":[205],"improvement":[206],"over":[207],"previous":[208],"approaches.":[209],"results":[211],"suggest":[212],"hybrid":[215],"presents":[217],"valuable":[219],"for":[221],"predicting":[222],"RT":[223],"chromatography,":[226],"potential":[228],"applications":[229],"metabolomics":[231]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":4}],"updated_date":"2026-03-27T14:29:43.386196","created_date":"2025-10-10T00:00:00"}
