{"id":"https://openalex.org/W4410541616","doi":"https://doi.org/10.1021/acs.jcim.5c00577","title":"Effective and Explainable Molecular Property Prediction by Chain-of-Thought Enabled Large Language Models and Multi-Modal Molecular Information Fusion","display_name":"Effective and Explainable Molecular Property Prediction by Chain-of-Thought Enabled Large Language Models and Multi-Modal Molecular Information Fusion","publication_year":2025,"publication_date":"2025-05-20","ids":{"openalex":"https://openalex.org/W4410541616","doi":"https://doi.org/10.1021/acs.jcim.5c00577","pmid":"https://pubmed.ncbi.nlm.nih.gov/40392109"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.5c00577","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.5c00577","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086122487","display_name":"Chang Jin","orcid":"https://orcid.org/0000-0002-0706-0415"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]},{"id":"https://openalex.org/I4390039265","display_name":"PRG S&Tech (South Korea)","ror":"https://ror.org/02sr2ee22","country_code":null,"type":"company","lineage":["https://openalex.org/I4390039265"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chang Jin","raw_affiliation_strings":["Department of Computer Science and Technology","Tongji University"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology","institution_ids":["https://openalex.org/I4390039265"]},{"raw_affiliation_string":"Tongji University","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064450823","display_name":"Siyuan Guo","orcid":"https://orcid.org/0000-0003-0378-830X"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]},{"id":"https://openalex.org/I4390039265","display_name":"PRG S&Tech (South Korea)","ror":"https://ror.org/02sr2ee22","country_code":null,"type":"company","lineage":["https://openalex.org/I4390039265"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siyuan Guo","raw_affiliation_strings":["Department of Computer Science and Technology","Tongji University"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology","institution_ids":["https://openalex.org/I4390039265"]},{"raw_affiliation_string":"Tongji University","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112389497","display_name":"Shuigeng Zhou","orcid":"https://orcid.org/0000-0002-1949-2768"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shuigeng Zhou","raw_affiliation_strings":["Fudan University","School of Computer Science"],"affiliations":[{"raw_affiliation_string":"Fudan University","institution_ids":["https://openalex.org/I24943067"]},{"raw_affiliation_string":"School of Computer Science","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086316879","display_name":"Jihong Guan","orcid":"https://orcid.org/0000-0003-2313-7635"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]},{"id":"https://openalex.org/I4390039265","display_name":"PRG S&Tech (South Korea)","ror":"https://ror.org/02sr2ee22","country_code":null,"type":"company","lineage":["https://openalex.org/I4390039265"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jihong Guan","raw_affiliation_strings":["Department of Computer Science and Technology","Tongji University"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology","institution_ids":["https://openalex.org/I4390039265"]},{"raw_affiliation_string":"Tongji University","institution_ids":["https://openalex.org/I116953780"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5086316879","https://openalex.org/A5112389497"],"corresponding_institution_ids":["https://openalex.org/I116953780","https://openalex.org/I24943067","https://openalex.org/I4390039265"],"apc_list":null,"apc_paid":null,"fwci":8.6541,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.97774086,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"65","issue":"11","first_page":"5438","last_page":"5455"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9585999846458435,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.6729714870452881},{"id":"https://openalex.org/keywords/property","display_name":"Property (philosophy)","score":0.6275835037231445},{"id":"https://openalex.org/keywords/chain","display_name":"Chain (unit)","score":0.5518275499343872},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5354625582695007},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.5179373621940613},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.44698452949523926},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41474515199661255},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.23278281092643738},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.2077201008796692},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.17108026146888733},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.14831912517547607},{"id":"https://openalex.org/keywords/epistemology","display_name":"Epistemology","score":0.11148667335510254}],"concepts":[{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.6729714870452881},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.6275835037231445},{"id":"https://openalex.org/C199185054","wikidata":"https://www.wikidata.org/wiki/Q552299","display_name":"Chain (unit)","level":2,"score":0.5518275499343872},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5354625582695007},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.5179373621940613},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.44698452949523926},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41474515199661255},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.23278281092643738},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.2077201008796692},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.17108026146888733},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.14831912517547607},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.11148667335510254},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000098342","descriptor_name":"Large Language Models","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000098342","descriptor_name":"Large Language Models","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000098342","descriptor_name":"Large Language Models","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015195","descriptor_name":"Drug Design","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015195","descriptor_name":"Drug Design","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015195","descriptor_name":"Drug Design","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1021/acs.jcim.5c00577","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.5c00577","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:40392109","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40392109","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.4300000071525574}],"awards":[{"id":"https://openalex.org/G2062780035","display_name":null,"funder_award_id":"62172300","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G245860340","display_name":null,"funder_award_id":"62372326","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W569478347","https://openalex.org/W1545231783","https://openalex.org/W1975147762","https://openalex.org/W1985572431","https://openalex.org/W2064675550","https://openalex.org/W2106983119","https://openalex.org/W2290847742","https://openalex.org/W2585034944","https://openalex.org/W2594183968","https://openalex.org/W2612690371","https://openalex.org/W2741095062","https://openalex.org/W2799054028","https://openalex.org/W2810023675","https://openalex.org/W2896457183","https://openalex.org/W2920835902","https://openalex.org/W2962876364","https://openalex.org/W2964015378","https://openalex.org/W2964113829","https://openalex.org/W2966357564","https://openalex.org/W2968734407","https://openalex.org/W2986232138","https://openalex.org/W3038823641","https://openalex.org/W3094060150","https://openalex.org/W3095602948","https://openalex.org/W3095883070","https://openalex.org/W3100157108","https://openalex.org/W3110901318","https://openalex.org/W3166272013","https://openalex.org/W3168867926","https://openalex.org/W3188589934","https://openalex.org/W3206711231","https://openalex.org/W4210313485","https://openalex.org/W4214868967","https://openalex.org/W4221143046","https://openalex.org/W4287828570","https://openalex.org/W4288407534","https://openalex.org/W4290930066","https://openalex.org/W4292779060","https://openalex.org/W4295846611","https://openalex.org/W4297733535","https://openalex.org/W4300537282","https://openalex.org/W4312632987","https://openalex.org/W4322718191","https://openalex.org/W4380989429","https://openalex.org/W4384616153","https://openalex.org/W4385064217","https://openalex.org/W4386012079","https://openalex.org/W4386614347","https://openalex.org/W4389157347","https://openalex.org/W4389888290","https://openalex.org/W4391272436","https://openalex.org/W4396678548","https://openalex.org/W4400046618","https://openalex.org/W4405254576","https://openalex.org/W4406271402","https://openalex.org/W4406779522"],"related_works":["https://openalex.org/W2379392295","https://openalex.org/W3160965418","https://openalex.org/W613940353","https://openalex.org/W2320915480","https://openalex.org/W2582753012","https://openalex.org/W2099421762","https://openalex.org/W2362990116","https://openalex.org/W2381300099","https://openalex.org/W2530546662","https://openalex.org/W2967030268"],"abstract_inverted_index":{"Molecular":[0],"property":[1,64,117,161,220,230],"prediction":[2,118,231],"(MPP)":[3],"plays":[4],"a":[5,150],"critical":[6],"role":[7],"in":[8,115],"drug":[9,131,159],"design":[10,132],"and":[11,25,89,91,133,153,172,192,201,208,241],"discovery.":[12],"Due":[13],"to":[14,59,140,213],"the":[15,43,47,95,184,190,195,247,258,266],"multimodal":[16,29,82,156,216],"nature":[17],"of":[18,49,75,143,176,194,246,260,268],"molecular":[19,27,40,63,76,116,160,169,173,177,217,229],"data":[20,226,249],"(e.g.,":[21],"1D":[22,165],"SMILES":[23,166],"strings":[24],"2D":[26,168],"graphs),":[28],"information":[30,83,98],"fusion":[31],"can":[32],"generally":[33],"achieve":[34],"better":[35],"performance":[36,114,238],"than":[37],"using":[38],"single-modality":[39],"data.":[41,181],"On":[42],"other":[44],"hand,":[45],"with":[46],"rise":[48],"large":[50],"language":[51],"models":[52,104],"(LLMs),":[53],"increasing":[54],"efforts":[55],"have":[56],"been":[57],"made":[58],"leverage":[60],"LLMs":[61],"for":[62,81,108,130,158,219,228],"prediction.":[65,221],"However,":[66],"existing":[67,144,253,269],"works":[68],"usually":[69],"use":[70],"one":[71],"or":[72],"two":[73],"modalities":[74],"data,":[77],"employ":[78],"simple":[79],"techniques":[80],"integration":[84],"such":[85],"as":[86,179],"straightforward":[87],"concatenation":[88],"summation,":[90],"cannot":[92,123],"comprehensively":[93],"exploit":[94],"rich":[96],"complementary":[97],"across":[99,204],"multiple":[100,205],"modalities.":[101,206],"Furthermore,":[102],"these":[103,141],"are":[105,128,211],"typically":[106],"designed":[107],"general":[109],"chemical":[110],"tasks,":[111],"making":[112],"their":[113],"suboptimal.":[119],"Worse":[120],"still,":[121],"they":[122],"provide":[124],"explainable":[125,154],"results,":[126],"which":[127,163],"important":[129],"discovery-related":[134],"tasks":[135],"including":[136],"MPP.":[137],"In":[138],"response":[139],"limitations":[142,267],"works,":[145],"this":[146],"paper":[147],"presents":[148],"LLM-MPP,":[149],"new,":[151],"effective,":[152],"LLM-driven":[155],"method":[157,235],"prediction,":[162],"leverages":[164],"strings,":[167],"graph":[170],"structures,":[171],"textual":[174],"descriptions":[175],"properties":[178],"training":[180],"By":[182],"incorporating":[183],"chain-of-thought":[185],"(CoT)":[186],"technique,":[187],"we":[188],"enhance":[189],"interpretability":[191],"transparency":[193],"proposed":[196],"method,":[197],"while":[198],"promoting":[199],"alignment":[200],"feature":[202],"extraction":[203],"Cross-attention":[207],"contrastive":[209],"learning":[210],"adopted":[212],"effectively":[214,264],"fuse":[215],"representations":[218],"Experiments":[222],"on":[223,239,244],"nine":[224],"benchmark":[225],"sets":[227],"demonstrate":[232],"that":[233],"our":[234,261],"achieves":[236],"state-of-the-art":[237],"5":[240],"ranks":[242],"second":[243],"1":[245],"9":[248],"sets,":[250],"surpassing":[251],"22":[252],"baselines.":[254],"Ablation":[255],"experiments":[256],"validate":[257],"effectiveness":[259],"innovative":[262],"modules,":[263],"addressing":[265],"models.":[270]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":4}],"updated_date":"2026-04-06T07:47:59.780226","created_date":"2025-10-10T00:00:00"}
